program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "5.33.5"}, {"coremlc-version", "1877.40.3"}})] { func main(tensor cache_length, tensor decoder_key_padding_mask, tensor encoder_output_embeds, tensor input_ids, tensor key_cache, tensor kv_cache_update_mask, tensor value_cache) { tensor var_80_axis_0 = const()[name = tensor("op_80_axis_0"), val = tensor(0)]; tensor var_80_batch_dims_0 = const()[name = tensor("op_80_batch_dims_0"), val = tensor(0)]; tensor var_80_validate_indices_0 = const()[name = tensor("op_80_validate_indices_0"), val = tensor(false)]; tensor embed_tokens_weight_to_fp16 = const()[name = tensor("embed_tokens_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor var_80_cast_fp16 = gather(axis = var_80_axis_0, batch_dims = var_80_batch_dims_0, indices = input_ids, validate_indices = var_80_validate_indices_0, x = embed_tokens_weight_to_fp16)[name = tensor("op_80_cast_fp16")]; tensor var_84_axis_0 = const()[name = tensor("op_84_axis_0"), val = tensor(0)]; tensor var_84_batch_dims_0 = const()[name = tensor("op_84_batch_dims_0"), val = tensor(0)]; tensor var_84_validate_indices_0 = const()[name = tensor("op_84_validate_indices_0"), val = tensor(false)]; tensor embed_positions_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(132777088))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(133350592))), name = tensor("embed_positions_weight_to_fp16_palettized"), shape = tensor([448, 1280])]; tensor cache_length_to_int16_dtype_0 = const()[name = tensor("cache_length_to_int16_dtype_0"), val = tensor("int16")]; tensor cast_0 = cast(dtype = cache_length_to_int16_dtype_0, x = cache_length)[name = tensor("cast_0")]; tensor var_84_cast_fp16_cast_int16 = gather(axis = var_84_axis_0, batch_dims = var_84_batch_dims_0, indices = cast_0, validate_indices = var_84_validate_indices_0, x = embed_positions_weight_to_fp16_palettized)[name = tensor("op_84_cast_fp16_cast_int16")]; tensor hidden_states_1_cast_fp16 = add(x = var_80_cast_fp16, y = var_84_cast_fp16_cast_int16)[name = tensor("hidden_states_1_cast_fp16")]; tensor var_98_axes_0 = const()[name = tensor("op_98_axes_0"), val = tensor([2])]; tensor var_98_cast_fp16 = expand_dims(axes = var_98_axes_0, x = hidden_states_1_cast_fp16)[name = tensor("op_98_cast_fp16")]; tensor inputs_1_axes_0 = const()[name = tensor("inputs_1_axes_0"), val = tensor([3])]; tensor inputs_1_cast_fp16 = expand_dims(axes = inputs_1_axes_0, x = var_98_cast_fp16)[name = tensor("inputs_1_cast_fp16")]; tensor tile_0 = const()[name = tensor("tile_0"), val = tensor([1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280])]; tensor var_103_axis_0 = const()[name = tensor("op_103_axis_0"), val = tensor(1)]; tensor var_103_cast_fp16_0, tensor var_103_cast_fp16_1, tensor var_103_cast_fp16_2, tensor var_103_cast_fp16_3, tensor var_103_cast_fp16_4, tensor var_103_cast_fp16_5, tensor var_103_cast_fp16_6, tensor var_103_cast_fp16_7, tensor var_103_cast_fp16_8, tensor var_103_cast_fp16_9, tensor var_103_cast_fp16_10, tensor var_103_cast_fp16_11, tensor var_103_cast_fp16_12, tensor var_103_cast_fp16_13, tensor var_103_cast_fp16_14, tensor var_103_cast_fp16_15, tensor var_103_cast_fp16_16, tensor var_103_cast_fp16_17, tensor var_103_cast_fp16_18, tensor var_103_cast_fp16_19, tensor var_103_cast_fp16_20, tensor var_103_cast_fp16_21, tensor var_103_cast_fp16_22, tensor var_103_cast_fp16_23, tensor var_103_cast_fp16_24, tensor var_103_cast_fp16_25, tensor var_103_cast_fp16_26, tensor var_103_cast_fp16_27, tensor var_103_cast_fp16_28, tensor var_103_cast_fp16_29, tensor var_103_cast_fp16_30, tensor var_103_cast_fp16_31 = split(axis = var_103_axis_0, split_sizes = tile_0, x = key_cache)[name = tensor("op_103_cast_fp16")]; tensor tile_1 = const()[name = tensor("tile_1"), val = tensor([1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280, 1280])]; tensor var_138_axis_0 = const()[name = tensor("op_138_axis_0"), val = tensor(1)]; tensor var_138_cast_fp16_0, tensor var_138_cast_fp16_1, tensor var_138_cast_fp16_2, tensor var_138_cast_fp16_3, tensor var_138_cast_fp16_4, tensor var_138_cast_fp16_5, tensor var_138_cast_fp16_6, tensor var_138_cast_fp16_7, tensor var_138_cast_fp16_8, tensor var_138_cast_fp16_9, tensor var_138_cast_fp16_10, tensor var_138_cast_fp16_11, tensor var_138_cast_fp16_12, tensor var_138_cast_fp16_13, tensor var_138_cast_fp16_14, tensor var_138_cast_fp16_15, tensor var_138_cast_fp16_16, tensor var_138_cast_fp16_17, tensor var_138_cast_fp16_18, tensor var_138_cast_fp16_19, tensor var_138_cast_fp16_20, tensor var_138_cast_fp16_21, tensor var_138_cast_fp16_22, tensor var_138_cast_fp16_23, tensor var_138_cast_fp16_24, tensor var_138_cast_fp16_25, tensor var_138_cast_fp16_26, tensor var_138_cast_fp16_27, tensor var_138_cast_fp16_28, tensor var_138_cast_fp16_29, tensor var_138_cast_fp16_30, tensor var_138_cast_fp16_31 = split(axis = var_138_axis_0, split_sizes = tile_1, x = value_cache)[name = tensor("op_138_cast_fp16")]; tensor var_176 = const()[name = tensor("op_176"), val = tensor(3)]; tensor var_183 = const()[name = tensor("op_183"), val = tensor(1)]; tensor var_184 = const()[name = tensor("op_184"), val = tensor(true)]; tensor var_196 = const()[name = tensor("op_196"), val = tensor([1])]; tensor channels_mean_1_cast_fp16 = reduce_mean(axes = var_196, keep_dims = var_184, x = inputs_1_cast_fp16)[name = tensor("channels_mean_1_cast_fp16")]; tensor zero_mean_1_cast_fp16 = sub(x = inputs_1_cast_fp16, y = channels_mean_1_cast_fp16)[name = tensor("zero_mean_1_cast_fp16")]; tensor zero_mean_sq_1_cast_fp16 = mul(x = zero_mean_1_cast_fp16, y = zero_mean_1_cast_fp16)[name = tensor("zero_mean_sq_1_cast_fp16")]; tensor var_200 = const()[name = tensor("op_200"), val = tensor([1])]; tensor var_201_cast_fp16 = reduce_mean(axes = var_200, keep_dims = var_184, x = zero_mean_sq_1_cast_fp16)[name = tensor("op_201_cast_fp16")]; tensor var_202_to_fp16 = const()[name = tensor("op_202_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_203_cast_fp16 = add(x = var_201_cast_fp16, y = var_202_to_fp16)[name = tensor("op_203_cast_fp16")]; tensor denom_1_epsilon_0 = const()[name = tensor("denom_1_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_1_cast_fp16 = rsqrt(epsilon = denom_1_epsilon_0, x = var_203_cast_fp16)[name = tensor("denom_1_cast_fp16")]; tensor out_1_cast_fp16 = mul(x = zero_mean_1_cast_fp16, y = denom_1_cast_fp16)[name = tensor("out_1_cast_fp16")]; tensor obj_1_mean_0_to_fp16 = const()[name = tensor("obj_1_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(133351168)))]; tensor obj_1_variance_0_to_fp16 = const()[name = tensor("obj_1_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(133353792)))]; tensor obj_1_gamma_0_to_fp16 = const()[name = tensor("obj_1_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(133356416)))]; tensor obj_1_beta_0_to_fp16 = const()[name = tensor("obj_1_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(133359040)))]; tensor obj_1_epsilon_0_to_fp16 = const()[name = tensor("obj_1_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_1_cast_fp16 = batch_norm(beta = obj_1_beta_0_to_fp16, epsilon = obj_1_epsilon_0_to_fp16, gamma = obj_1_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_1_cast_fp16)[name = tensor("obj_1_cast_fp16")]; tensor var_218 = const()[name = tensor("op_218"), val = tensor([1, 1])]; tensor var_220 = const()[name = tensor("op_220"), val = tensor([1, 1])]; tensor query_1_pad_type_0 = const()[name = tensor("query_1_pad_type_0"), val = tensor("custom")]; tensor query_1_pad_0 = const()[name = tensor("query_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_self_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_0_self_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(133361664)))]; tensor layers_0_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_0_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(136638528)))]; tensor query_1_cast_fp16 = conv(bias = layers_0_self_attn_q_proj_bias_to_fp16, dilations = var_220, groups = var_183, pad = query_1_pad_0, pad_type = query_1_pad_type_0, strides = var_218, weight = layers_0_self_attn_q_proj_weight_to_fp16, x = obj_1_cast_fp16)[name = tensor("query_1_cast_fp16")]; tensor var_224 = const()[name = tensor("op_224"), val = tensor([1, 1])]; tensor var_226 = const()[name = tensor("op_226"), val = tensor([1, 1])]; tensor current_key_1_pad_type_0 = const()[name = tensor("current_key_1_pad_type_0"), val = tensor("custom")]; tensor current_key_1_pad_0 = const()[name = tensor("current_key_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_self_attn_k_proj_weight_to_fp16 = const()[name = tensor("layers_0_self_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(136641152)))]; tensor current_key_1_cast_fp16 = conv(dilations = var_226, groups = var_183, pad = current_key_1_pad_0, pad_type = current_key_1_pad_type_0, strides = var_224, weight = layers_0_self_attn_k_proj_weight_to_fp16, x = obj_1_cast_fp16)[name = tensor("current_key_1_cast_fp16")]; tensor var_231 = const()[name = tensor("op_231"), val = tensor([1, 1])]; tensor var_233 = const()[name = tensor("op_233"), val = tensor([1, 1])]; tensor current_value_1_pad_type_0 = const()[name = tensor("current_value_1_pad_type_0"), val = tensor("custom")]; tensor current_value_1_pad_0 = const()[name = tensor("current_value_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139918016))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141146880))), name = tensor("layers_0_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_0_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_0_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141147072)))]; tensor current_value_1_cast_fp16 = conv(bias = layers_0_self_attn_v_proj_bias_to_fp16, dilations = var_233, groups = var_183, pad = current_value_1_pad_0, pad_type = current_value_1_pad_type_0, strides = var_231, weight = layers_0_self_attn_v_proj_weight_to_fp16_palettized, x = obj_1_cast_fp16)[name = tensor("current_value_1_cast_fp16")]; tensor var_237_axes_0 = const()[name = tensor("op_237_axes_0"), val = tensor([1])]; tensor var_237_cast_fp16 = expand_dims(axes = var_237_axes_0, x = kv_cache_update_mask)[name = tensor("op_237_cast_fp16")]; tensor var_238_axes_0 = const()[name = tensor("op_238_axes_0"), val = tensor([2])]; tensor var_238_cast_fp16 = expand_dims(axes = var_238_axes_0, x = var_237_cast_fp16)[name = tensor("op_238_cast_fp16")]; tensor var_240_cast_fp16 = mul(x = current_key_1_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_240_cast_fp16")]; tensor var_177_to_fp16 = const()[name = tensor("op_177_to_fp16"), val = tensor(0x1p+0)]; tensor var_241_cast_fp16 = sub(x = var_177_to_fp16, y = var_238_cast_fp16)[name = tensor("op_241_cast_fp16")]; tensor var_242_cast_fp16 = mul(x = var_103_cast_fp16_0, y = var_241_cast_fp16)[name = tensor("op_242_cast_fp16")]; tensor key_1_cast_fp16 = add(x = var_240_cast_fp16, y = var_242_cast_fp16)[name = tensor("key_1_cast_fp16")]; tensor var_244_cast_fp16 = mul(x = current_value_1_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_244_cast_fp16")]; tensor var_246_cast_fp16 = mul(x = var_138_cast_fp16_0, y = var_241_cast_fp16)[name = tensor("op_246_cast_fp16")]; tensor value_1_cast_fp16 = add(x = var_244_cast_fp16, y = var_246_cast_fp16)[name = tensor("value_1_cast_fp16")]; tensor var_249 = const()[name = tensor("op_249"), val = tensor([1, 20, 64, -1])]; tensor var_250_cast_fp16 = reshape(shape = var_249, x = query_1_cast_fp16)[name = tensor("op_250_cast_fp16")]; tensor var_251_to_fp16 = const()[name = tensor("op_251_to_fp16"), val = tensor(0x1p-3)]; tensor var_252_cast_fp16 = mul(x = var_250_cast_fp16, y = var_251_to_fp16)[name = tensor("op_252_cast_fp16")]; tensor var_253 = const()[name = tensor("op_253"), val = tensor([1, 20, 64, -1])]; tensor var_254_cast_fp16 = reshape(shape = var_253, x = key_1_cast_fp16)[name = tensor("op_254_cast_fp16")]; tensor mh_w_1_transpose_x_0 = const()[name = tensor("mh_w_1_transpose_x_0"), val = tensor(true)]; tensor mh_w_1_transpose_y_0 = const()[name = tensor("mh_w_1_transpose_y_0"), val = tensor(false)]; tensor mh_w_1_cast_fp16 = matmul(transpose_x = mh_w_1_transpose_x_0, transpose_y = mh_w_1_transpose_y_0, x = var_252_cast_fp16, y = var_254_cast_fp16)[name = tensor("mh_w_1_cast_fp16")]; tensor var_258_axes_0 = const()[name = tensor("op_258_axes_0"), val = tensor([1])]; tensor var_258_cast_fp16 = expand_dims(axes = var_258_axes_0, x = decoder_key_padding_mask)[name = tensor("op_258_cast_fp16")]; tensor var_259_axes_0 = const()[name = tensor("op_259_axes_0"), val = tensor([2])]; tensor var_259_cast_fp16 = expand_dims(axes = var_259_axes_0, x = var_258_cast_fp16)[name = tensor("op_259_cast_fp16")]; tensor mh_w_3_cast_fp16 = add(x = mh_w_1_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_3_cast_fp16")]; tensor var_262_cast_fp16 = softmax(axis = var_176, x = mh_w_3_cast_fp16)[name = tensor("op_262_cast_fp16")]; tensor var_263 = const()[name = tensor("op_263"), val = tensor([1, 20, 64, -1])]; tensor var_264_cast_fp16 = reshape(shape = var_263, x = value_1_cast_fp16)[name = tensor("op_264_cast_fp16")]; tensor attn_1_transpose_x_0 = const()[name = tensor("attn_1_transpose_x_0"), val = tensor(false)]; tensor attn_1_transpose_y_0 = const()[name = tensor("attn_1_transpose_y_0"), val = tensor(true)]; tensor attn_1_cast_fp16 = matmul(transpose_x = attn_1_transpose_x_0, transpose_y = attn_1_transpose_y_0, x = var_264_cast_fp16, y = var_262_cast_fp16)[name = tensor("attn_1_cast_fp16")]; tensor var_267 = const()[name = tensor("op_267"), val = tensor([1, 1280, 1, -1])]; tensor input_1_cast_fp16 = reshape(shape = var_267, x = attn_1_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_271 = const()[name = tensor("op_271"), val = tensor([1, 1])]; tensor var_273 = const()[name = tensor("op_273"), val = tensor([1, 1])]; tensor obj_7_pad_type_0 = const()[name = tensor("obj_7_pad_type_0"), val = tensor("custom")]; tensor obj_7_pad_0 = const()[name = tensor("obj_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_self_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_0_self_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(141149696)))]; tensor layers_0_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_0_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144426560)))]; tensor obj_7_cast_fp16 = conv(bias = layers_0_self_attn_o_proj_bias_to_fp16, dilations = var_273, groups = var_183, pad = obj_7_pad_0, pad_type = obj_7_pad_type_0, strides = var_271, weight = layers_0_self_attn_o_proj_weight_to_fp16, x = input_1_cast_fp16)[name = tensor("obj_7_cast_fp16")]; tensor inputs_3_cast_fp16 = add(x = inputs_1_cast_fp16, y = obj_7_cast_fp16)[name = tensor("inputs_3_cast_fp16")]; tensor var_283 = const()[name = tensor("op_283"), val = tensor([1])]; tensor channels_mean_3_cast_fp16 = reduce_mean(axes = var_283, keep_dims = var_184, x = inputs_3_cast_fp16)[name = tensor("channels_mean_3_cast_fp16")]; tensor zero_mean_3_cast_fp16 = sub(x = inputs_3_cast_fp16, y = channels_mean_3_cast_fp16)[name = tensor("zero_mean_3_cast_fp16")]; tensor zero_mean_sq_3_cast_fp16 = mul(x = zero_mean_3_cast_fp16, y = zero_mean_3_cast_fp16)[name = tensor("zero_mean_sq_3_cast_fp16")]; tensor var_287 = const()[name = tensor("op_287"), val = tensor([1])]; tensor var_288_cast_fp16 = reduce_mean(axes = var_287, keep_dims = var_184, x = zero_mean_sq_3_cast_fp16)[name = tensor("op_288_cast_fp16")]; tensor var_289_to_fp16 = const()[name = tensor("op_289_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_290_cast_fp16 = add(x = var_288_cast_fp16, y = var_289_to_fp16)[name = tensor("op_290_cast_fp16")]; tensor denom_3_epsilon_0 = const()[name = tensor("denom_3_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_3_cast_fp16 = rsqrt(epsilon = denom_3_epsilon_0, x = var_290_cast_fp16)[name = tensor("denom_3_cast_fp16")]; tensor out_3_cast_fp16 = mul(x = zero_mean_3_cast_fp16, y = denom_3_cast_fp16)[name = tensor("out_3_cast_fp16")]; tensor obj_9_gamma_0_to_fp16 = const()[name = tensor("obj_9_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144429184)))]; tensor obj_9_beta_0_to_fp16 = const()[name = tensor("obj_9_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144431808)))]; tensor obj_9_epsilon_0_to_fp16 = const()[name = tensor("obj_9_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_9_cast_fp16 = batch_norm(beta = obj_9_beta_0_to_fp16, epsilon = obj_9_epsilon_0_to_fp16, gamma = obj_9_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_3_cast_fp16)[name = tensor("obj_9_cast_fp16")]; tensor var_305 = const()[name = tensor("op_305"), val = tensor([1, 1])]; tensor var_307 = const()[name = tensor("op_307"), val = tensor([1, 1])]; tensor query_3_pad_type_0 = const()[name = tensor("query_3_pad_type_0"), val = tensor("custom")]; tensor query_3_pad_0 = const()[name = tensor("query_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144434432))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145253696))), name = tensor("layers_0_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_0_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_0_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145253824)))]; tensor query_3_cast_fp16 = conv(bias = layers_0_encoder_attn_q_proj_bias_to_fp16, dilations = var_307, groups = var_183, pad = query_3_pad_0, pad_type = query_3_pad_type_0, strides = var_305, weight = layers_0_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_9_cast_fp16)[name = tensor("query_3_cast_fp16")]; tensor var_311 = const()[name = tensor("op_311"), val = tensor([1, 1])]; tensor var_313 = const()[name = tensor("op_313"), val = tensor([1, 1])]; tensor key_3_pad_type_0 = const()[name = tensor("key_3_pad_type_0"), val = tensor("custom")]; tensor key_3_pad_0 = const()[name = tensor("key_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(145256448))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146075712))), name = tensor("layers_0_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_3_cast_fp16 = conv(dilations = var_313, groups = var_183, pad = key_3_pad_0, pad_type = key_3_pad_type_0, strides = var_311, weight = layers_0_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_3_cast_fp16")]; tensor var_318 = const()[name = tensor("op_318"), val = tensor([1, 1])]; tensor var_320 = const()[name = tensor("op_320"), val = tensor([1, 1])]; tensor value_3_pad_type_0 = const()[name = tensor("value_3_pad_type_0"), val = tensor("custom")]; tensor value_3_pad_0 = const()[name = tensor("value_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146075840))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146895104))), name = tensor("layers_0_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_0_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_0_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146895232)))]; tensor value_3_cast_fp16 = conv(bias = layers_0_encoder_attn_v_proj_bias_to_fp16, dilations = var_320, groups = var_183, pad = value_3_pad_0, pad_type = value_3_pad_type_0, strides = var_318, weight = layers_0_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_3_cast_fp16")]; tensor var_324 = const()[name = tensor("op_324"), val = tensor([1, 20, 64, -1])]; tensor var_325_cast_fp16 = reshape(shape = var_324, x = query_3_cast_fp16)[name = tensor("op_325_cast_fp16")]; tensor var_326_to_fp16 = const()[name = tensor("op_326_to_fp16"), val = tensor(0x1p-3)]; tensor var_327_cast_fp16 = mul(x = var_325_cast_fp16, y = var_326_to_fp16)[name = tensor("op_327_cast_fp16")]; tensor var_328 = const()[name = tensor("op_328"), val = tensor([1, 20, 64, -1])]; tensor var_329_cast_fp16 = reshape(shape = var_328, x = key_3_cast_fp16)[name = tensor("op_329_cast_fp16")]; tensor mh_w_5_transpose_x_0 = const()[name = tensor("mh_w_5_transpose_x_0"), val = tensor(true)]; tensor mh_w_5_transpose_y_0 = const()[name = tensor("mh_w_5_transpose_y_0"), val = tensor(false)]; tensor mh_w_5_cast_fp16 = matmul(transpose_x = mh_w_5_transpose_x_0, transpose_y = mh_w_5_transpose_y_0, x = var_327_cast_fp16, y = var_329_cast_fp16)[name = tensor("mh_w_5_cast_fp16")]; tensor var_332_cast_fp16 = softmax(axis = var_176, x = mh_w_5_cast_fp16)[name = tensor("op_332_cast_fp16")]; tensor var_333 = const()[name = tensor("op_333"), val = tensor([1, 20, 64, -1])]; tensor var_334_cast_fp16 = reshape(shape = var_333, x = value_3_cast_fp16)[name = tensor("op_334_cast_fp16")]; tensor attn_3_transpose_x_0 = const()[name = tensor("attn_3_transpose_x_0"), val = tensor(false)]; tensor attn_3_transpose_y_0 = const()[name = tensor("attn_3_transpose_y_0"), val = tensor(true)]; tensor attn_3_cast_fp16 = matmul(transpose_x = attn_3_transpose_x_0, transpose_y = attn_3_transpose_y_0, x = var_334_cast_fp16, y = var_332_cast_fp16)[name = tensor("attn_3_cast_fp16")]; tensor var_337 = const()[name = tensor("op_337"), val = tensor([1, 1280, 1, -1])]; tensor input_3_cast_fp16 = reshape(shape = var_337, x = attn_3_cast_fp16)[name = tensor("input_3_cast_fp16")]; tensor var_341 = const()[name = tensor("op_341"), val = tensor([1, 1])]; tensor var_343 = const()[name = tensor("op_343"), val = tensor([1, 1])]; tensor obj_11_pad_type_0 = const()[name = tensor("obj_11_pad_type_0"), val = tensor("custom")]; tensor obj_11_pad_0 = const()[name = tensor("obj_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(146897856))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148126720))), name = tensor("layers_0_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_0_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_0_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148126912)))]; tensor obj_11_cast_fp16 = conv(bias = layers_0_encoder_attn_o_proj_bias_to_fp16, dilations = var_343, groups = var_183, pad = obj_11_pad_0, pad_type = obj_11_pad_type_0, strides = var_341, weight = layers_0_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_3_cast_fp16)[name = tensor("obj_11_cast_fp16")]; tensor inputs_5_cast_fp16 = add(x = inputs_3_cast_fp16, y = obj_11_cast_fp16)[name = tensor("inputs_5_cast_fp16")]; tensor var_349 = const()[name = tensor("op_349"), val = tensor([1])]; tensor channels_mean_5_cast_fp16 = reduce_mean(axes = var_349, keep_dims = var_184, x = inputs_5_cast_fp16)[name = tensor("channels_mean_5_cast_fp16")]; tensor zero_mean_5_cast_fp16 = sub(x = inputs_5_cast_fp16, y = channels_mean_5_cast_fp16)[name = tensor("zero_mean_5_cast_fp16")]; tensor zero_mean_sq_5_cast_fp16 = mul(x = zero_mean_5_cast_fp16, y = zero_mean_5_cast_fp16)[name = tensor("zero_mean_sq_5_cast_fp16")]; tensor var_353 = const()[name = tensor("op_353"), val = tensor([1])]; tensor var_354_cast_fp16 = reduce_mean(axes = var_353, keep_dims = var_184, x = zero_mean_sq_5_cast_fp16)[name = tensor("op_354_cast_fp16")]; tensor var_355_to_fp16 = const()[name = tensor("op_355_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_356_cast_fp16 = add(x = var_354_cast_fp16, y = var_355_to_fp16)[name = tensor("op_356_cast_fp16")]; tensor denom_5_epsilon_0 = const()[name = tensor("denom_5_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_5_cast_fp16 = rsqrt(epsilon = denom_5_epsilon_0, x = var_356_cast_fp16)[name = tensor("denom_5_cast_fp16")]; tensor out_5_cast_fp16 = mul(x = zero_mean_5_cast_fp16, y = denom_5_cast_fp16)[name = tensor("out_5_cast_fp16")]; tensor input_5_gamma_0_to_fp16 = const()[name = tensor("input_5_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148129536)))]; tensor input_5_beta_0_to_fp16 = const()[name = tensor("input_5_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148132160)))]; tensor input_5_epsilon_0_to_fp16 = const()[name = tensor("input_5_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_5_cast_fp16 = batch_norm(beta = input_5_beta_0_to_fp16, epsilon = input_5_epsilon_0_to_fp16, gamma = input_5_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_5_cast_fp16)[name = tensor("input_5_cast_fp16")]; tensor var_367 = const()[name = tensor("op_367"), val = tensor([1, 1])]; tensor var_369 = const()[name = tensor("op_369"), val = tensor([1, 1])]; tensor input_7_pad_type_0 = const()[name = tensor("input_7_pad_type_0"), val = tensor("custom")]; tensor input_7_pad_0 = const()[name = tensor("input_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148134784))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151411648))), name = tensor("layers_0_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_0_fc1_bias_to_fp16 = const()[name = tensor("layers_0_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151411776)))]; tensor input_7_cast_fp16 = conv(bias = layers_0_fc1_bias_to_fp16, dilations = var_369, groups = var_183, pad = input_7_pad_0, pad_type = input_7_pad_type_0, strides = var_367, weight = layers_0_fc1_weight_to_fp16_palettized, x = input_5_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor input_9_mode_0 = const()[name = tensor("input_9_mode_0"), val = tensor("EXACT")]; tensor input_9_cast_fp16 = gelu(mode = input_9_mode_0, x = input_7_cast_fp16)[name = tensor("input_9_cast_fp16")]; tensor var_375 = const()[name = tensor("op_375"), val = tensor([1, 1])]; tensor var_377 = const()[name = tensor("op_377"), val = tensor([1, 1])]; tensor hidden_states_3_pad_type_0 = const()[name = tensor("hidden_states_3_pad_type_0"), val = tensor("custom")]; tensor hidden_states_3_pad_0 = const()[name = tensor("hidden_states_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_0_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151422080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157975744))), name = tensor("layers_0_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_0_fc2_bias_to_fp16 = const()[name = tensor("layers_0_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157976320)))]; tensor hidden_states_3_cast_fp16 = conv(bias = layers_0_fc2_bias_to_fp16, dilations = var_377, groups = var_183, pad = hidden_states_3_pad_0, pad_type = hidden_states_3_pad_type_0, strides = var_375, weight = layers_0_fc2_weight_to_fp16_palettized, x = input_9_cast_fp16)[name = tensor("hidden_states_3_cast_fp16")]; tensor inputs_7_cast_fp16 = add(x = inputs_5_cast_fp16, y = hidden_states_3_cast_fp16)[name = tensor("inputs_7_cast_fp16")]; tensor var_390 = const()[name = tensor("op_390"), val = tensor(3)]; tensor var_397 = const()[name = tensor("op_397"), val = tensor(1)]; tensor var_398 = const()[name = tensor("op_398"), val = tensor(true)]; tensor var_410 = const()[name = tensor("op_410"), val = tensor([1])]; tensor channels_mean_7_cast_fp16 = reduce_mean(axes = var_410, keep_dims = var_398, x = inputs_7_cast_fp16)[name = tensor("channels_mean_7_cast_fp16")]; tensor zero_mean_7_cast_fp16 = sub(x = inputs_7_cast_fp16, y = channels_mean_7_cast_fp16)[name = tensor("zero_mean_7_cast_fp16")]; tensor zero_mean_sq_7_cast_fp16 = mul(x = zero_mean_7_cast_fp16, y = zero_mean_7_cast_fp16)[name = tensor("zero_mean_sq_7_cast_fp16")]; tensor var_414 = const()[name = tensor("op_414"), val = tensor([1])]; tensor var_415_cast_fp16 = reduce_mean(axes = var_414, keep_dims = var_398, x = zero_mean_sq_7_cast_fp16)[name = tensor("op_415_cast_fp16")]; tensor var_416_to_fp16 = const()[name = tensor("op_416_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_417_cast_fp16 = add(x = var_415_cast_fp16, y = var_416_to_fp16)[name = tensor("op_417_cast_fp16")]; tensor denom_7_epsilon_0 = const()[name = tensor("denom_7_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_7_cast_fp16 = rsqrt(epsilon = denom_7_epsilon_0, x = var_417_cast_fp16)[name = tensor("denom_7_cast_fp16")]; tensor out_7_cast_fp16 = mul(x = zero_mean_7_cast_fp16, y = denom_7_cast_fp16)[name = tensor("out_7_cast_fp16")]; tensor obj_13_gamma_0_to_fp16 = const()[name = tensor("obj_13_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157978944)))]; tensor obj_13_beta_0_to_fp16 = const()[name = tensor("obj_13_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157981568)))]; tensor obj_13_epsilon_0_to_fp16 = const()[name = tensor("obj_13_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_13_cast_fp16 = batch_norm(beta = obj_13_beta_0_to_fp16, epsilon = obj_13_epsilon_0_to_fp16, gamma = obj_13_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_7_cast_fp16)[name = tensor("obj_13_cast_fp16")]; tensor var_432 = const()[name = tensor("op_432"), val = tensor([1, 1])]; tensor var_434 = const()[name = tensor("op_434"), val = tensor([1, 1])]; tensor query_5_pad_type_0 = const()[name = tensor("query_5_pad_type_0"), val = tensor("custom")]; tensor query_5_pad_0 = const()[name = tensor("query_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(157984192))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158803456))), name = tensor("layers_1_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_1_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_1_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158803584)))]; tensor query_5_cast_fp16 = conv(bias = layers_1_self_attn_q_proj_bias_to_fp16, dilations = var_434, groups = var_397, pad = query_5_pad_0, pad_type = query_5_pad_type_0, strides = var_432, weight = layers_1_self_attn_q_proj_weight_to_fp16_palettized, x = obj_13_cast_fp16)[name = tensor("query_5_cast_fp16")]; tensor var_438 = const()[name = tensor("op_438"), val = tensor([1, 1])]; tensor var_440 = const()[name = tensor("op_440"), val = tensor([1, 1])]; tensor current_key_3_pad_type_0 = const()[name = tensor("current_key_3_pad_type_0"), val = tensor("custom")]; tensor current_key_3_pad_0 = const()[name = tensor("current_key_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(158806208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159625472))), name = tensor("layers_1_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_3_cast_fp16 = conv(dilations = var_440, groups = var_397, pad = current_key_3_pad_0, pad_type = current_key_3_pad_type_0, strides = var_438, weight = layers_1_self_attn_k_proj_weight_to_fp16_palettized, x = obj_13_cast_fp16)[name = tensor("current_key_3_cast_fp16")]; tensor var_445 = const()[name = tensor("op_445"), val = tensor([1, 1])]; tensor var_447 = const()[name = tensor("op_447"), val = tensor([1, 1])]; tensor current_value_3_pad_type_0 = const()[name = tensor("current_value_3_pad_type_0"), val = tensor("custom")]; tensor current_value_3_pad_0 = const()[name = tensor("current_value_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_self_attn_v_proj_weight_to_fp16 = const()[name = tensor("layers_1_self_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159625600)))]; tensor layers_1_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_1_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(162902464)))]; tensor current_value_3_cast_fp16 = conv(bias = layers_1_self_attn_v_proj_bias_to_fp16, dilations = var_447, groups = var_397, pad = current_value_3_pad_0, pad_type = current_value_3_pad_type_0, strides = var_445, weight = layers_1_self_attn_v_proj_weight_to_fp16, x = obj_13_cast_fp16)[name = tensor("current_value_3_cast_fp16")]; tensor var_454_cast_fp16 = mul(x = current_key_3_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_454_cast_fp16")]; tensor var_456_cast_fp16 = mul(x = var_103_cast_fp16_1, y = var_241_cast_fp16)[name = tensor("op_456_cast_fp16")]; tensor key_5_cast_fp16 = add(x = var_454_cast_fp16, y = var_456_cast_fp16)[name = tensor("key_5_cast_fp16")]; tensor var_458_cast_fp16 = mul(x = current_value_3_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_458_cast_fp16")]; tensor var_460_cast_fp16 = mul(x = var_138_cast_fp16_1, y = var_241_cast_fp16)[name = tensor("op_460_cast_fp16")]; tensor value_5_cast_fp16 = add(x = var_458_cast_fp16, y = var_460_cast_fp16)[name = tensor("value_5_cast_fp16")]; tensor var_463 = const()[name = tensor("op_463"), val = tensor([1, 20, 64, -1])]; tensor var_464_cast_fp16 = reshape(shape = var_463, x = query_5_cast_fp16)[name = tensor("op_464_cast_fp16")]; tensor var_465_to_fp16 = const()[name = tensor("op_465_to_fp16"), val = tensor(0x1p-3)]; tensor var_466_cast_fp16 = mul(x = var_464_cast_fp16, y = var_465_to_fp16)[name = tensor("op_466_cast_fp16")]; tensor var_467 = const()[name = tensor("op_467"), val = tensor([1, 20, 64, -1])]; tensor var_468_cast_fp16 = reshape(shape = var_467, x = key_5_cast_fp16)[name = tensor("op_468_cast_fp16")]; tensor mh_w_7_transpose_x_0 = const()[name = tensor("mh_w_7_transpose_x_0"), val = tensor(true)]; tensor mh_w_7_transpose_y_0 = const()[name = tensor("mh_w_7_transpose_y_0"), val = tensor(false)]; tensor mh_w_7_cast_fp16 = matmul(transpose_x = mh_w_7_transpose_x_0, transpose_y = mh_w_7_transpose_y_0, x = var_466_cast_fp16, y = var_468_cast_fp16)[name = tensor("mh_w_7_cast_fp16")]; tensor mh_w_9_cast_fp16 = add(x = mh_w_7_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_9_cast_fp16")]; tensor var_476_cast_fp16 = softmax(axis = var_390, x = mh_w_9_cast_fp16)[name = tensor("op_476_cast_fp16")]; tensor var_477 = const()[name = tensor("op_477"), val = tensor([1, 20, 64, -1])]; tensor var_478_cast_fp16 = reshape(shape = var_477, x = value_5_cast_fp16)[name = tensor("op_478_cast_fp16")]; tensor attn_5_transpose_x_0 = const()[name = tensor("attn_5_transpose_x_0"), val = tensor(false)]; tensor attn_5_transpose_y_0 = const()[name = tensor("attn_5_transpose_y_0"), val = tensor(true)]; tensor attn_5_cast_fp16 = matmul(transpose_x = attn_5_transpose_x_0, transpose_y = attn_5_transpose_y_0, x = var_478_cast_fp16, y = var_476_cast_fp16)[name = tensor("attn_5_cast_fp16")]; tensor var_481 = const()[name = tensor("op_481"), val = tensor([1, 1280, 1, -1])]; tensor input_11_cast_fp16 = reshape(shape = var_481, x = attn_5_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor var_485 = const()[name = tensor("op_485"), val = tensor([1, 1])]; tensor var_487 = const()[name = tensor("op_487"), val = tensor([1, 1])]; tensor obj_19_pad_type_0 = const()[name = tensor("obj_19_pad_type_0"), val = tensor("custom")]; tensor obj_19_pad_0 = const()[name = tensor("obj_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(162905088))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164133952))), name = tensor("layers_1_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_1_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_1_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164134144)))]; tensor obj_19_cast_fp16 = conv(bias = layers_1_self_attn_o_proj_bias_to_fp16, dilations = var_487, groups = var_397, pad = obj_19_pad_0, pad_type = obj_19_pad_type_0, strides = var_485, weight = layers_1_self_attn_o_proj_weight_to_fp16_palettized, x = input_11_cast_fp16)[name = tensor("obj_19_cast_fp16")]; tensor inputs_9_cast_fp16 = add(x = inputs_7_cast_fp16, y = obj_19_cast_fp16)[name = tensor("inputs_9_cast_fp16")]; tensor var_497 = const()[name = tensor("op_497"), val = tensor([1])]; tensor channels_mean_9_cast_fp16 = reduce_mean(axes = var_497, keep_dims = var_398, x = inputs_9_cast_fp16)[name = tensor("channels_mean_9_cast_fp16")]; tensor zero_mean_9_cast_fp16 = sub(x = inputs_9_cast_fp16, y = channels_mean_9_cast_fp16)[name = tensor("zero_mean_9_cast_fp16")]; tensor zero_mean_sq_9_cast_fp16 = mul(x = zero_mean_9_cast_fp16, y = zero_mean_9_cast_fp16)[name = tensor("zero_mean_sq_9_cast_fp16")]; tensor var_501 = const()[name = tensor("op_501"), val = tensor([1])]; tensor var_502_cast_fp16 = reduce_mean(axes = var_501, keep_dims = var_398, x = zero_mean_sq_9_cast_fp16)[name = tensor("op_502_cast_fp16")]; tensor var_503_to_fp16 = const()[name = tensor("op_503_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_504_cast_fp16 = add(x = var_502_cast_fp16, y = var_503_to_fp16)[name = tensor("op_504_cast_fp16")]; tensor denom_9_epsilon_0 = const()[name = tensor("denom_9_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_9_cast_fp16 = rsqrt(epsilon = denom_9_epsilon_0, x = var_504_cast_fp16)[name = tensor("denom_9_cast_fp16")]; tensor out_9_cast_fp16 = mul(x = zero_mean_9_cast_fp16, y = denom_9_cast_fp16)[name = tensor("out_9_cast_fp16")]; tensor obj_21_gamma_0_to_fp16 = const()[name = tensor("obj_21_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164136768)))]; tensor obj_21_beta_0_to_fp16 = const()[name = tensor("obj_21_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164139392)))]; tensor obj_21_epsilon_0_to_fp16 = const()[name = tensor("obj_21_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_21_cast_fp16 = batch_norm(beta = obj_21_beta_0_to_fp16, epsilon = obj_21_epsilon_0_to_fp16, gamma = obj_21_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_9_cast_fp16)[name = tensor("obj_21_cast_fp16")]; tensor var_519 = const()[name = tensor("op_519"), val = tensor([1, 1])]; tensor var_521 = const()[name = tensor("op_521"), val = tensor([1, 1])]; tensor query_7_pad_type_0 = const()[name = tensor("query_7_pad_type_0"), val = tensor("custom")]; tensor query_7_pad_0 = const()[name = tensor("query_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164142016))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164961280))), name = tensor("layers_1_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_1_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_1_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164961408)))]; tensor query_7_cast_fp16 = conv(bias = layers_1_encoder_attn_q_proj_bias_to_fp16, dilations = var_521, groups = var_397, pad = query_7_pad_0, pad_type = query_7_pad_type_0, strides = var_519, weight = layers_1_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_21_cast_fp16)[name = tensor("query_7_cast_fp16")]; tensor var_525 = const()[name = tensor("op_525"), val = tensor([1, 1])]; tensor var_527 = const()[name = tensor("op_527"), val = tensor([1, 1])]; tensor key_7_pad_type_0 = const()[name = tensor("key_7_pad_type_0"), val = tensor("custom")]; tensor key_7_pad_0 = const()[name = tensor("key_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(164964032))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165783296))), name = tensor("layers_1_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_7_cast_fp16 = conv(dilations = var_527, groups = var_397, pad = key_7_pad_0, pad_type = key_7_pad_type_0, strides = var_525, weight = layers_1_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_7_cast_fp16")]; tensor var_532 = const()[name = tensor("op_532"), val = tensor([1, 1])]; tensor var_534 = const()[name = tensor("op_534"), val = tensor([1, 1])]; tensor value_7_pad_type_0 = const()[name = tensor("value_7_pad_type_0"), val = tensor("custom")]; tensor value_7_pad_0 = const()[name = tensor("value_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165783424))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166602688))), name = tensor("layers_1_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_1_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_1_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166602816)))]; tensor value_7_cast_fp16 = conv(bias = layers_1_encoder_attn_v_proj_bias_to_fp16, dilations = var_534, groups = var_397, pad = value_7_pad_0, pad_type = value_7_pad_type_0, strides = var_532, weight = layers_1_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_7_cast_fp16")]; tensor var_538 = const()[name = tensor("op_538"), val = tensor([1, 20, 64, -1])]; tensor var_539_cast_fp16 = reshape(shape = var_538, x = query_7_cast_fp16)[name = tensor("op_539_cast_fp16")]; tensor var_540_to_fp16 = const()[name = tensor("op_540_to_fp16"), val = tensor(0x1p-3)]; tensor var_541_cast_fp16 = mul(x = var_539_cast_fp16, y = var_540_to_fp16)[name = tensor("op_541_cast_fp16")]; tensor var_542 = const()[name = tensor("op_542"), val = tensor([1, 20, 64, -1])]; tensor var_543_cast_fp16 = reshape(shape = var_542, x = key_7_cast_fp16)[name = tensor("op_543_cast_fp16")]; tensor mh_w_11_transpose_x_0 = const()[name = tensor("mh_w_11_transpose_x_0"), val = tensor(true)]; tensor mh_w_11_transpose_y_0 = const()[name = tensor("mh_w_11_transpose_y_0"), val = tensor(false)]; tensor mh_w_11_cast_fp16 = matmul(transpose_x = mh_w_11_transpose_x_0, transpose_y = mh_w_11_transpose_y_0, x = var_541_cast_fp16, y = var_543_cast_fp16)[name = tensor("mh_w_11_cast_fp16")]; tensor var_546_cast_fp16 = softmax(axis = var_390, x = mh_w_11_cast_fp16)[name = tensor("op_546_cast_fp16")]; tensor var_547 = const()[name = tensor("op_547"), val = tensor([1, 20, 64, -1])]; tensor var_548_cast_fp16 = reshape(shape = var_547, x = value_7_cast_fp16)[name = tensor("op_548_cast_fp16")]; tensor attn_7_transpose_x_0 = const()[name = tensor("attn_7_transpose_x_0"), val = tensor(false)]; tensor attn_7_transpose_y_0 = const()[name = tensor("attn_7_transpose_y_0"), val = tensor(true)]; tensor attn_7_cast_fp16 = matmul(transpose_x = attn_7_transpose_x_0, transpose_y = attn_7_transpose_y_0, x = var_548_cast_fp16, y = var_546_cast_fp16)[name = tensor("attn_7_cast_fp16")]; tensor var_551 = const()[name = tensor("op_551"), val = tensor([1, 1280, 1, -1])]; tensor input_13_cast_fp16 = reshape(shape = var_551, x = attn_7_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor var_555 = const()[name = tensor("op_555"), val = tensor([1, 1])]; tensor var_557 = const()[name = tensor("op_557"), val = tensor([1, 1])]; tensor obj_23_pad_type_0 = const()[name = tensor("obj_23_pad_type_0"), val = tensor("custom")]; tensor obj_23_pad_0 = const()[name = tensor("obj_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166605440))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167834304))), name = tensor("layers_1_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_1_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_1_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167834496)))]; tensor obj_23_cast_fp16 = conv(bias = layers_1_encoder_attn_o_proj_bias_to_fp16, dilations = var_557, groups = var_397, pad = obj_23_pad_0, pad_type = obj_23_pad_type_0, strides = var_555, weight = layers_1_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_13_cast_fp16)[name = tensor("obj_23_cast_fp16")]; tensor inputs_11_cast_fp16 = add(x = inputs_9_cast_fp16, y = obj_23_cast_fp16)[name = tensor("inputs_11_cast_fp16")]; tensor var_563 = const()[name = tensor("op_563"), val = tensor([1])]; tensor channels_mean_11_cast_fp16 = reduce_mean(axes = var_563, keep_dims = var_398, x = inputs_11_cast_fp16)[name = tensor("channels_mean_11_cast_fp16")]; tensor zero_mean_11_cast_fp16 = sub(x = inputs_11_cast_fp16, y = channels_mean_11_cast_fp16)[name = tensor("zero_mean_11_cast_fp16")]; tensor zero_mean_sq_11_cast_fp16 = mul(x = zero_mean_11_cast_fp16, y = zero_mean_11_cast_fp16)[name = tensor("zero_mean_sq_11_cast_fp16")]; tensor var_567 = const()[name = tensor("op_567"), val = tensor([1])]; tensor var_568_cast_fp16 = reduce_mean(axes = var_567, keep_dims = var_398, x = zero_mean_sq_11_cast_fp16)[name = tensor("op_568_cast_fp16")]; tensor var_569_to_fp16 = const()[name = tensor("op_569_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_570_cast_fp16 = add(x = var_568_cast_fp16, y = var_569_to_fp16)[name = tensor("op_570_cast_fp16")]; tensor denom_11_epsilon_0 = const()[name = tensor("denom_11_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_11_cast_fp16 = rsqrt(epsilon = denom_11_epsilon_0, x = var_570_cast_fp16)[name = tensor("denom_11_cast_fp16")]; tensor out_11_cast_fp16 = mul(x = zero_mean_11_cast_fp16, y = denom_11_cast_fp16)[name = tensor("out_11_cast_fp16")]; tensor input_15_gamma_0_to_fp16 = const()[name = tensor("input_15_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167837120)))]; tensor input_15_beta_0_to_fp16 = const()[name = tensor("input_15_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167839744)))]; tensor input_15_epsilon_0_to_fp16 = const()[name = tensor("input_15_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_15_cast_fp16 = batch_norm(beta = input_15_beta_0_to_fp16, epsilon = input_15_epsilon_0_to_fp16, gamma = input_15_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_11_cast_fp16)[name = tensor("input_15_cast_fp16")]; tensor var_581 = const()[name = tensor("op_581"), val = tensor([1, 1])]; tensor var_583 = const()[name = tensor("op_583"), val = tensor([1, 1])]; tensor input_17_pad_type_0 = const()[name = tensor("input_17_pad_type_0"), val = tensor("custom")]; tensor input_17_pad_0 = const()[name = tensor("input_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167842368))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172757632))), name = tensor("layers_1_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_1_fc1_bias_to_fp16 = const()[name = tensor("layers_1_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172757824)))]; tensor input_17_cast_fp16 = conv(bias = layers_1_fc1_bias_to_fp16, dilations = var_583, groups = var_397, pad = input_17_pad_0, pad_type = input_17_pad_type_0, strides = var_581, weight = layers_1_fc1_weight_to_fp16_palettized, x = input_15_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor input_19_mode_0 = const()[name = tensor("input_19_mode_0"), val = tensor("EXACT")]; tensor input_19_cast_fp16 = gelu(mode = input_19_mode_0, x = input_17_cast_fp16)[name = tensor("input_19_cast_fp16")]; tensor var_589 = const()[name = tensor("op_589"), val = tensor([1, 1])]; tensor var_591 = const()[name = tensor("op_591"), val = tensor([1, 1])]; tensor hidden_states_5_pad_type_0 = const()[name = tensor("hidden_states_5_pad_type_0"), val = tensor("custom")]; tensor hidden_states_5_pad_0 = const()[name = tensor("hidden_states_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_1_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172768128))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177683392))), name = tensor("layers_1_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_1_fc2_bias_to_fp16 = const()[name = tensor("layers_1_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177683584)))]; tensor hidden_states_5_cast_fp16 = conv(bias = layers_1_fc2_bias_to_fp16, dilations = var_591, groups = var_397, pad = hidden_states_5_pad_0, pad_type = hidden_states_5_pad_type_0, strides = var_589, weight = layers_1_fc2_weight_to_fp16_palettized, x = input_19_cast_fp16)[name = tensor("hidden_states_5_cast_fp16")]; tensor inputs_13_cast_fp16 = add(x = inputs_11_cast_fp16, y = hidden_states_5_cast_fp16)[name = tensor("inputs_13_cast_fp16")]; tensor var_604 = const()[name = tensor("op_604"), val = tensor(3)]; tensor var_611 = const()[name = tensor("op_611"), val = tensor(1)]; tensor var_612 = const()[name = tensor("op_612"), val = tensor(true)]; tensor var_624 = const()[name = tensor("op_624"), val = tensor([1])]; tensor channels_mean_13_cast_fp16 = reduce_mean(axes = var_624, keep_dims = var_612, x = inputs_13_cast_fp16)[name = tensor("channels_mean_13_cast_fp16")]; tensor zero_mean_13_cast_fp16 = sub(x = inputs_13_cast_fp16, y = channels_mean_13_cast_fp16)[name = tensor("zero_mean_13_cast_fp16")]; tensor zero_mean_sq_13_cast_fp16 = mul(x = zero_mean_13_cast_fp16, y = zero_mean_13_cast_fp16)[name = tensor("zero_mean_sq_13_cast_fp16")]; tensor var_628 = const()[name = tensor("op_628"), val = tensor([1])]; tensor var_629_cast_fp16 = reduce_mean(axes = var_628, keep_dims = var_612, x = zero_mean_sq_13_cast_fp16)[name = tensor("op_629_cast_fp16")]; tensor var_630_to_fp16 = const()[name = tensor("op_630_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_631_cast_fp16 = add(x = var_629_cast_fp16, y = var_630_to_fp16)[name = tensor("op_631_cast_fp16")]; tensor denom_13_epsilon_0 = const()[name = tensor("denom_13_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_13_cast_fp16 = rsqrt(epsilon = denom_13_epsilon_0, x = var_631_cast_fp16)[name = tensor("denom_13_cast_fp16")]; tensor out_13_cast_fp16 = mul(x = zero_mean_13_cast_fp16, y = denom_13_cast_fp16)[name = tensor("out_13_cast_fp16")]; tensor obj_25_gamma_0_to_fp16 = const()[name = tensor("obj_25_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177686208)))]; tensor obj_25_beta_0_to_fp16 = const()[name = tensor("obj_25_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177688832)))]; tensor obj_25_epsilon_0_to_fp16 = const()[name = tensor("obj_25_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_25_cast_fp16 = batch_norm(beta = obj_25_beta_0_to_fp16, epsilon = obj_25_epsilon_0_to_fp16, gamma = obj_25_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_13_cast_fp16)[name = tensor("obj_25_cast_fp16")]; tensor var_646 = const()[name = tensor("op_646"), val = tensor([1, 1])]; tensor var_648 = const()[name = tensor("op_648"), val = tensor([1, 1])]; tensor query_9_pad_type_0 = const()[name = tensor("query_9_pad_type_0"), val = tensor("custom")]; tensor query_9_pad_0 = const()[name = tensor("query_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177691456))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178510720))), name = tensor("layers_2_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_2_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_2_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178510848)))]; tensor query_9_cast_fp16 = conv(bias = layers_2_self_attn_q_proj_bias_to_fp16, dilations = var_648, groups = var_611, pad = query_9_pad_0, pad_type = query_9_pad_type_0, strides = var_646, weight = layers_2_self_attn_q_proj_weight_to_fp16_palettized, x = obj_25_cast_fp16)[name = tensor("query_9_cast_fp16")]; tensor var_652 = const()[name = tensor("op_652"), val = tensor([1, 1])]; tensor var_654 = const()[name = tensor("op_654"), val = tensor([1, 1])]; tensor current_key_5_pad_type_0 = const()[name = tensor("current_key_5_pad_type_0"), val = tensor("custom")]; tensor current_key_5_pad_0 = const()[name = tensor("current_key_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178513472))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179332736))), name = tensor("layers_2_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_5_cast_fp16 = conv(dilations = var_654, groups = var_611, pad = current_key_5_pad_0, pad_type = current_key_5_pad_type_0, strides = var_652, weight = layers_2_self_attn_k_proj_weight_to_fp16_palettized, x = obj_25_cast_fp16)[name = tensor("current_key_5_cast_fp16")]; tensor var_659 = const()[name = tensor("op_659"), val = tensor([1, 1])]; tensor var_661 = const()[name = tensor("op_661"), val = tensor([1, 1])]; tensor current_value_5_pad_type_0 = const()[name = tensor("current_value_5_pad_type_0"), val = tensor("custom")]; tensor current_value_5_pad_0 = const()[name = tensor("current_value_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(179332864))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180152128))), name = tensor("layers_2_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_2_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_2_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180152256)))]; tensor current_value_5_cast_fp16 = conv(bias = layers_2_self_attn_v_proj_bias_to_fp16, dilations = var_661, groups = var_611, pad = current_value_5_pad_0, pad_type = current_value_5_pad_type_0, strides = var_659, weight = layers_2_self_attn_v_proj_weight_to_fp16_palettized, x = obj_25_cast_fp16)[name = tensor("current_value_5_cast_fp16")]; tensor var_668_cast_fp16 = mul(x = current_key_5_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_668_cast_fp16")]; tensor var_670_cast_fp16 = mul(x = var_103_cast_fp16_2, y = var_241_cast_fp16)[name = tensor("op_670_cast_fp16")]; tensor key_9_cast_fp16 = add(x = var_668_cast_fp16, y = var_670_cast_fp16)[name = tensor("key_9_cast_fp16")]; tensor var_672_cast_fp16 = mul(x = current_value_5_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_672_cast_fp16")]; tensor var_674_cast_fp16 = mul(x = var_138_cast_fp16_2, y = var_241_cast_fp16)[name = tensor("op_674_cast_fp16")]; tensor value_9_cast_fp16 = add(x = var_672_cast_fp16, y = var_674_cast_fp16)[name = tensor("value_9_cast_fp16")]; tensor var_677 = const()[name = tensor("op_677"), val = tensor([1, 20, 64, -1])]; tensor var_678_cast_fp16 = reshape(shape = var_677, x = query_9_cast_fp16)[name = tensor("op_678_cast_fp16")]; tensor var_679_to_fp16 = const()[name = tensor("op_679_to_fp16"), val = tensor(0x1p-3)]; tensor var_680_cast_fp16 = mul(x = var_678_cast_fp16, y = var_679_to_fp16)[name = tensor("op_680_cast_fp16")]; tensor var_681 = const()[name = tensor("op_681"), val = tensor([1, 20, 64, -1])]; tensor var_682_cast_fp16 = reshape(shape = var_681, x = key_9_cast_fp16)[name = tensor("op_682_cast_fp16")]; tensor mh_w_13_transpose_x_0 = const()[name = tensor("mh_w_13_transpose_x_0"), val = tensor(true)]; tensor mh_w_13_transpose_y_0 = const()[name = tensor("mh_w_13_transpose_y_0"), val = tensor(false)]; tensor mh_w_13_cast_fp16 = matmul(transpose_x = mh_w_13_transpose_x_0, transpose_y = mh_w_13_transpose_y_0, x = var_680_cast_fp16, y = var_682_cast_fp16)[name = tensor("mh_w_13_cast_fp16")]; tensor mh_w_15_cast_fp16 = add(x = mh_w_13_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_15_cast_fp16")]; tensor var_690_cast_fp16 = softmax(axis = var_604, x = mh_w_15_cast_fp16)[name = tensor("op_690_cast_fp16")]; tensor var_691 = const()[name = tensor("op_691"), val = tensor([1, 20, 64, -1])]; tensor var_692_cast_fp16 = reshape(shape = var_691, x = value_9_cast_fp16)[name = tensor("op_692_cast_fp16")]; tensor attn_9_transpose_x_0 = const()[name = tensor("attn_9_transpose_x_0"), val = tensor(false)]; tensor attn_9_transpose_y_0 = const()[name = tensor("attn_9_transpose_y_0"), val = tensor(true)]; tensor attn_9_cast_fp16 = matmul(transpose_x = attn_9_transpose_x_0, transpose_y = attn_9_transpose_y_0, x = var_692_cast_fp16, y = var_690_cast_fp16)[name = tensor("attn_9_cast_fp16")]; tensor var_695 = const()[name = tensor("op_695"), val = tensor([1, 1280, 1, -1])]; tensor input_21_cast_fp16 = reshape(shape = var_695, x = attn_9_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor var_699 = const()[name = tensor("op_699"), val = tensor([1, 1])]; tensor var_701 = const()[name = tensor("op_701"), val = tensor([1, 1])]; tensor obj_31_pad_type_0 = const()[name = tensor("obj_31_pad_type_0"), val = tensor("custom")]; tensor obj_31_pad_0 = const()[name = tensor("obj_31_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(180154880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181793344))), name = tensor("layers_2_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_2_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_2_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181793920)))]; tensor obj_31_cast_fp16 = conv(bias = layers_2_self_attn_o_proj_bias_to_fp16, dilations = var_701, groups = var_611, pad = obj_31_pad_0, pad_type = obj_31_pad_type_0, strides = var_699, weight = layers_2_self_attn_o_proj_weight_to_fp16_palettized, x = input_21_cast_fp16)[name = tensor("obj_31_cast_fp16")]; tensor inputs_15_cast_fp16 = add(x = inputs_13_cast_fp16, y = obj_31_cast_fp16)[name = tensor("inputs_15_cast_fp16")]; tensor var_711 = const()[name = tensor("op_711"), val = tensor([1])]; tensor channels_mean_15_cast_fp16 = reduce_mean(axes = var_711, keep_dims = var_612, x = inputs_15_cast_fp16)[name = tensor("channels_mean_15_cast_fp16")]; tensor zero_mean_15_cast_fp16 = sub(x = inputs_15_cast_fp16, y = channels_mean_15_cast_fp16)[name = tensor("zero_mean_15_cast_fp16")]; tensor zero_mean_sq_15_cast_fp16 = mul(x = zero_mean_15_cast_fp16, y = zero_mean_15_cast_fp16)[name = tensor("zero_mean_sq_15_cast_fp16")]; tensor var_715 = const()[name = tensor("op_715"), val = tensor([1])]; tensor var_716_cast_fp16 = reduce_mean(axes = var_715, keep_dims = var_612, x = zero_mean_sq_15_cast_fp16)[name = tensor("op_716_cast_fp16")]; tensor var_717_to_fp16 = const()[name = tensor("op_717_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_718_cast_fp16 = add(x = var_716_cast_fp16, y = var_717_to_fp16)[name = tensor("op_718_cast_fp16")]; tensor denom_15_epsilon_0 = const()[name = tensor("denom_15_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_15_cast_fp16 = rsqrt(epsilon = denom_15_epsilon_0, x = var_718_cast_fp16)[name = tensor("denom_15_cast_fp16")]; tensor out_15_cast_fp16 = mul(x = zero_mean_15_cast_fp16, y = denom_15_cast_fp16)[name = tensor("out_15_cast_fp16")]; tensor obj_33_gamma_0_to_fp16 = const()[name = tensor("obj_33_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181796544)))]; tensor obj_33_beta_0_to_fp16 = const()[name = tensor("obj_33_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181799168)))]; tensor obj_33_epsilon_0_to_fp16 = const()[name = tensor("obj_33_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_33_cast_fp16 = batch_norm(beta = obj_33_beta_0_to_fp16, epsilon = obj_33_epsilon_0_to_fp16, gamma = obj_33_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_15_cast_fp16)[name = tensor("obj_33_cast_fp16")]; tensor var_733 = const()[name = tensor("op_733"), val = tensor([1, 1])]; tensor var_735 = const()[name = tensor("op_735"), val = tensor([1, 1])]; tensor query_11_pad_type_0 = const()[name = tensor("query_11_pad_type_0"), val = tensor("custom")]; tensor query_11_pad_0 = const()[name = tensor("query_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(181801792))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182621056))), name = tensor("layers_2_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_2_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_2_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182621184)))]; tensor query_11_cast_fp16 = conv(bias = layers_2_encoder_attn_q_proj_bias_to_fp16, dilations = var_735, groups = var_611, pad = query_11_pad_0, pad_type = query_11_pad_type_0, strides = var_733, weight = layers_2_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_33_cast_fp16)[name = tensor("query_11_cast_fp16")]; tensor var_739 = const()[name = tensor("op_739"), val = tensor([1, 1])]; tensor var_741 = const()[name = tensor("op_741"), val = tensor([1, 1])]; tensor key_11_pad_type_0 = const()[name = tensor("key_11_pad_type_0"), val = tensor("custom")]; tensor key_11_pad_0 = const()[name = tensor("key_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(182623808))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183443072))), name = tensor("layers_2_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_11_cast_fp16 = conv(dilations = var_741, groups = var_611, pad = key_11_pad_0, pad_type = key_11_pad_type_0, strides = var_739, weight = layers_2_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_11_cast_fp16")]; tensor var_746 = const()[name = tensor("op_746"), val = tensor([1, 1])]; tensor var_748 = const()[name = tensor("op_748"), val = tensor([1, 1])]; tensor value_11_pad_type_0 = const()[name = tensor("value_11_pad_type_0"), val = tensor("custom")]; tensor value_11_pad_0 = const()[name = tensor("value_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(183443200))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184262464))), name = tensor("layers_2_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_2_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_2_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184262592)))]; tensor value_11_cast_fp16 = conv(bias = layers_2_encoder_attn_v_proj_bias_to_fp16, dilations = var_748, groups = var_611, pad = value_11_pad_0, pad_type = value_11_pad_type_0, strides = var_746, weight = layers_2_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_11_cast_fp16")]; tensor var_752 = const()[name = tensor("op_752"), val = tensor([1, 20, 64, -1])]; tensor var_753_cast_fp16 = reshape(shape = var_752, x = query_11_cast_fp16)[name = tensor("op_753_cast_fp16")]; tensor var_754_to_fp16 = const()[name = tensor("op_754_to_fp16"), val = tensor(0x1p-3)]; tensor var_755_cast_fp16 = mul(x = var_753_cast_fp16, y = var_754_to_fp16)[name = tensor("op_755_cast_fp16")]; tensor var_756 = const()[name = tensor("op_756"), val = tensor([1, 20, 64, -1])]; tensor var_757_cast_fp16 = reshape(shape = var_756, x = key_11_cast_fp16)[name = tensor("op_757_cast_fp16")]; tensor mh_w_17_transpose_x_0 = const()[name = tensor("mh_w_17_transpose_x_0"), val = tensor(true)]; tensor mh_w_17_transpose_y_0 = const()[name = tensor("mh_w_17_transpose_y_0"), val = tensor(false)]; tensor mh_w_17_cast_fp16 = matmul(transpose_x = mh_w_17_transpose_x_0, transpose_y = mh_w_17_transpose_y_0, x = var_755_cast_fp16, y = var_757_cast_fp16)[name = tensor("mh_w_17_cast_fp16")]; tensor var_760_cast_fp16 = softmax(axis = var_604, x = mh_w_17_cast_fp16)[name = tensor("op_760_cast_fp16")]; tensor var_761 = const()[name = tensor("op_761"), val = tensor([1, 20, 64, -1])]; tensor var_762_cast_fp16 = reshape(shape = var_761, x = value_11_cast_fp16)[name = tensor("op_762_cast_fp16")]; tensor attn_11_transpose_x_0 = const()[name = tensor("attn_11_transpose_x_0"), val = tensor(false)]; tensor attn_11_transpose_y_0 = const()[name = tensor("attn_11_transpose_y_0"), val = tensor(true)]; tensor attn_11_cast_fp16 = matmul(transpose_x = attn_11_transpose_x_0, transpose_y = attn_11_transpose_y_0, x = var_762_cast_fp16, y = var_760_cast_fp16)[name = tensor("attn_11_cast_fp16")]; tensor var_765 = const()[name = tensor("op_765"), val = tensor([1, 1280, 1, -1])]; tensor input_23_cast_fp16 = reshape(shape = var_765, x = attn_11_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor var_769 = const()[name = tensor("op_769"), val = tensor([1, 1])]; tensor var_771 = const()[name = tensor("op_771"), val = tensor([1, 1])]; tensor obj_35_pad_type_0 = const()[name = tensor("obj_35_pad_type_0"), val = tensor("custom")]; tensor obj_35_pad_0 = const()[name = tensor("obj_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184265216))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185084480))), name = tensor("layers_2_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_2_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_2_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185084608)))]; tensor obj_35_cast_fp16 = conv(bias = layers_2_encoder_attn_o_proj_bias_to_fp16, dilations = var_771, groups = var_611, pad = obj_35_pad_0, pad_type = obj_35_pad_type_0, strides = var_769, weight = layers_2_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_23_cast_fp16)[name = tensor("obj_35_cast_fp16")]; tensor inputs_17_cast_fp16 = add(x = inputs_15_cast_fp16, y = obj_35_cast_fp16)[name = tensor("inputs_17_cast_fp16")]; tensor var_777 = const()[name = tensor("op_777"), val = tensor([1])]; tensor channels_mean_17_cast_fp16 = reduce_mean(axes = var_777, keep_dims = var_612, x = inputs_17_cast_fp16)[name = tensor("channels_mean_17_cast_fp16")]; tensor zero_mean_17_cast_fp16 = sub(x = inputs_17_cast_fp16, y = channels_mean_17_cast_fp16)[name = tensor("zero_mean_17_cast_fp16")]; tensor zero_mean_sq_17_cast_fp16 = mul(x = zero_mean_17_cast_fp16, y = zero_mean_17_cast_fp16)[name = tensor("zero_mean_sq_17_cast_fp16")]; tensor var_781 = const()[name = tensor("op_781"), val = tensor([1])]; tensor var_782_cast_fp16 = reduce_mean(axes = var_781, keep_dims = var_612, x = zero_mean_sq_17_cast_fp16)[name = tensor("op_782_cast_fp16")]; tensor var_783_to_fp16 = const()[name = tensor("op_783_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_784_cast_fp16 = add(x = var_782_cast_fp16, y = var_783_to_fp16)[name = tensor("op_784_cast_fp16")]; tensor denom_17_epsilon_0 = const()[name = tensor("denom_17_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_17_cast_fp16 = rsqrt(epsilon = denom_17_epsilon_0, x = var_784_cast_fp16)[name = tensor("denom_17_cast_fp16")]; tensor out_17_cast_fp16 = mul(x = zero_mean_17_cast_fp16, y = denom_17_cast_fp16)[name = tensor("out_17_cast_fp16")]; tensor input_25_gamma_0_to_fp16 = const()[name = tensor("input_25_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185087232)))]; tensor input_25_beta_0_to_fp16 = const()[name = tensor("input_25_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185089856)))]; tensor input_25_epsilon_0_to_fp16 = const()[name = tensor("input_25_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_25_cast_fp16 = batch_norm(beta = input_25_beta_0_to_fp16, epsilon = input_25_epsilon_0_to_fp16, gamma = input_25_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_17_cast_fp16)[name = tensor("input_25_cast_fp16")]; tensor var_795 = const()[name = tensor("op_795"), val = tensor([1, 1])]; tensor var_797 = const()[name = tensor("op_797"), val = tensor([1, 1])]; tensor input_27_pad_type_0 = const()[name = tensor("input_27_pad_type_0"), val = tensor("custom")]; tensor input_27_pad_0 = const()[name = tensor("input_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185092480))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190007744))), name = tensor("layers_2_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_2_fc1_bias_to_fp16 = const()[name = tensor("layers_2_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190007936)))]; tensor input_27_cast_fp16 = conv(bias = layers_2_fc1_bias_to_fp16, dilations = var_797, groups = var_611, pad = input_27_pad_0, pad_type = input_27_pad_type_0, strides = var_795, weight = layers_2_fc1_weight_to_fp16_palettized, x = input_25_cast_fp16)[name = tensor("input_27_cast_fp16")]; tensor input_29_mode_0 = const()[name = tensor("input_29_mode_0"), val = tensor("EXACT")]; tensor input_29_cast_fp16 = gelu(mode = input_29_mode_0, x = input_27_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor var_803 = const()[name = tensor("op_803"), val = tensor([1, 1])]; tensor var_805 = const()[name = tensor("op_805"), val = tensor([1, 1])]; tensor hidden_states_7_pad_type_0 = const()[name = tensor("hidden_states_7_pad_type_0"), val = tensor("custom")]; tensor hidden_states_7_pad_0 = const()[name = tensor("hidden_states_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_2_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190018240))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194933504))), name = tensor("layers_2_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_2_fc2_bias_to_fp16 = const()[name = tensor("layers_2_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194933696)))]; tensor hidden_states_7_cast_fp16 = conv(bias = layers_2_fc2_bias_to_fp16, dilations = var_805, groups = var_611, pad = hidden_states_7_pad_0, pad_type = hidden_states_7_pad_type_0, strides = var_803, weight = layers_2_fc2_weight_to_fp16_palettized, x = input_29_cast_fp16)[name = tensor("hidden_states_7_cast_fp16")]; tensor inputs_19_cast_fp16 = add(x = inputs_17_cast_fp16, y = hidden_states_7_cast_fp16)[name = tensor("inputs_19_cast_fp16")]; tensor var_818 = const()[name = tensor("op_818"), val = tensor(3)]; tensor var_825 = const()[name = tensor("op_825"), val = tensor(1)]; tensor var_826 = const()[name = tensor("op_826"), val = tensor(true)]; tensor var_838 = const()[name = tensor("op_838"), val = tensor([1])]; tensor channels_mean_19_cast_fp16 = reduce_mean(axes = var_838, keep_dims = var_826, x = inputs_19_cast_fp16)[name = tensor("channels_mean_19_cast_fp16")]; tensor zero_mean_19_cast_fp16 = sub(x = inputs_19_cast_fp16, y = channels_mean_19_cast_fp16)[name = tensor("zero_mean_19_cast_fp16")]; tensor zero_mean_sq_19_cast_fp16 = mul(x = zero_mean_19_cast_fp16, y = zero_mean_19_cast_fp16)[name = tensor("zero_mean_sq_19_cast_fp16")]; tensor var_842 = const()[name = tensor("op_842"), val = tensor([1])]; tensor var_843_cast_fp16 = reduce_mean(axes = var_842, keep_dims = var_826, x = zero_mean_sq_19_cast_fp16)[name = tensor("op_843_cast_fp16")]; tensor var_844_to_fp16 = const()[name = tensor("op_844_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_845_cast_fp16 = add(x = var_843_cast_fp16, y = var_844_to_fp16)[name = tensor("op_845_cast_fp16")]; tensor denom_19_epsilon_0 = const()[name = tensor("denom_19_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_19_cast_fp16 = rsqrt(epsilon = denom_19_epsilon_0, x = var_845_cast_fp16)[name = tensor("denom_19_cast_fp16")]; tensor out_19_cast_fp16 = mul(x = zero_mean_19_cast_fp16, y = denom_19_cast_fp16)[name = tensor("out_19_cast_fp16")]; tensor obj_37_gamma_0_to_fp16 = const()[name = tensor("obj_37_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194936320)))]; tensor obj_37_beta_0_to_fp16 = const()[name = tensor("obj_37_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194938944)))]; tensor obj_37_epsilon_0_to_fp16 = const()[name = tensor("obj_37_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_37_cast_fp16 = batch_norm(beta = obj_37_beta_0_to_fp16, epsilon = obj_37_epsilon_0_to_fp16, gamma = obj_37_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_19_cast_fp16)[name = tensor("obj_37_cast_fp16")]; tensor var_860 = const()[name = tensor("op_860"), val = tensor([1, 1])]; tensor var_862 = const()[name = tensor("op_862"), val = tensor([1, 1])]; tensor query_13_pad_type_0 = const()[name = tensor("query_13_pad_type_0"), val = tensor("custom")]; tensor query_13_pad_0 = const()[name = tensor("query_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194941568))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195760832))), name = tensor("layers_3_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_3_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_3_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195760960)))]; tensor query_13_cast_fp16 = conv(bias = layers_3_self_attn_q_proj_bias_to_fp16, dilations = var_862, groups = var_825, pad = query_13_pad_0, pad_type = query_13_pad_type_0, strides = var_860, weight = layers_3_self_attn_q_proj_weight_to_fp16_palettized, x = obj_37_cast_fp16)[name = tensor("query_13_cast_fp16")]; tensor var_866 = const()[name = tensor("op_866"), val = tensor([1, 1])]; tensor var_868 = const()[name = tensor("op_868"), val = tensor([1, 1])]; tensor current_key_7_pad_type_0 = const()[name = tensor("current_key_7_pad_type_0"), val = tensor("custom")]; tensor current_key_7_pad_0 = const()[name = tensor("current_key_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(195763584))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196582848))), name = tensor("layers_3_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_7_cast_fp16 = conv(dilations = var_868, groups = var_825, pad = current_key_7_pad_0, pad_type = current_key_7_pad_type_0, strides = var_866, weight = layers_3_self_attn_k_proj_weight_to_fp16_palettized, x = obj_37_cast_fp16)[name = tensor("current_key_7_cast_fp16")]; tensor var_873 = const()[name = tensor("op_873"), val = tensor([1, 1])]; tensor var_875 = const()[name = tensor("op_875"), val = tensor([1, 1])]; tensor current_value_7_pad_type_0 = const()[name = tensor("current_value_7_pad_type_0"), val = tensor("custom")]; tensor current_value_7_pad_0 = const()[name = tensor("current_value_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(196582976))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(197402240))), name = tensor("layers_3_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_3_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_3_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(197402368)))]; tensor current_value_7_cast_fp16 = conv(bias = layers_3_self_attn_v_proj_bias_to_fp16, dilations = var_875, groups = var_825, pad = current_value_7_pad_0, pad_type = current_value_7_pad_type_0, strides = var_873, weight = layers_3_self_attn_v_proj_weight_to_fp16_palettized, x = obj_37_cast_fp16)[name = tensor("current_value_7_cast_fp16")]; tensor var_882_cast_fp16 = mul(x = current_key_7_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_882_cast_fp16")]; tensor var_884_cast_fp16 = mul(x = var_103_cast_fp16_3, y = var_241_cast_fp16)[name = tensor("op_884_cast_fp16")]; tensor key_13_cast_fp16 = add(x = var_882_cast_fp16, y = var_884_cast_fp16)[name = tensor("key_13_cast_fp16")]; tensor var_886_cast_fp16 = mul(x = current_value_7_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_886_cast_fp16")]; tensor var_888_cast_fp16 = mul(x = var_138_cast_fp16_3, y = var_241_cast_fp16)[name = tensor("op_888_cast_fp16")]; tensor value_13_cast_fp16 = add(x = var_886_cast_fp16, y = var_888_cast_fp16)[name = tensor("value_13_cast_fp16")]; tensor var_891 = const()[name = tensor("op_891"), val = tensor([1, 20, 64, -1])]; tensor var_892_cast_fp16 = reshape(shape = var_891, x = query_13_cast_fp16)[name = tensor("op_892_cast_fp16")]; tensor var_893_to_fp16 = const()[name = tensor("op_893_to_fp16"), val = tensor(0x1p-3)]; tensor var_894_cast_fp16 = mul(x = var_892_cast_fp16, y = var_893_to_fp16)[name = tensor("op_894_cast_fp16")]; tensor var_895 = const()[name = tensor("op_895"), val = tensor([1, 20, 64, -1])]; tensor var_896_cast_fp16 = reshape(shape = var_895, x = key_13_cast_fp16)[name = tensor("op_896_cast_fp16")]; tensor mh_w_19_transpose_x_0 = const()[name = tensor("mh_w_19_transpose_x_0"), val = tensor(true)]; tensor mh_w_19_transpose_y_0 = const()[name = tensor("mh_w_19_transpose_y_0"), val = tensor(false)]; tensor mh_w_19_cast_fp16 = matmul(transpose_x = mh_w_19_transpose_x_0, transpose_y = mh_w_19_transpose_y_0, x = var_894_cast_fp16, y = var_896_cast_fp16)[name = tensor("mh_w_19_cast_fp16")]; tensor mh_w_21_cast_fp16 = add(x = mh_w_19_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_21_cast_fp16")]; tensor var_904_cast_fp16 = softmax(axis = var_818, x = mh_w_21_cast_fp16)[name = tensor("op_904_cast_fp16")]; tensor var_905 = const()[name = tensor("op_905"), val = tensor([1, 20, 64, -1])]; tensor var_906_cast_fp16 = reshape(shape = var_905, x = value_13_cast_fp16)[name = tensor("op_906_cast_fp16")]; tensor attn_13_transpose_x_0 = const()[name = tensor("attn_13_transpose_x_0"), val = tensor(false)]; tensor attn_13_transpose_y_0 = const()[name = tensor("attn_13_transpose_y_0"), val = tensor(true)]; tensor attn_13_cast_fp16 = matmul(transpose_x = attn_13_transpose_x_0, transpose_y = attn_13_transpose_y_0, x = var_906_cast_fp16, y = var_904_cast_fp16)[name = tensor("attn_13_cast_fp16")]; tensor var_909 = const()[name = tensor("op_909"), val = tensor([1, 1280, 1, -1])]; tensor input_31_cast_fp16 = reshape(shape = var_909, x = attn_13_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor var_913 = const()[name = tensor("op_913"), val = tensor([1, 1])]; tensor var_915 = const()[name = tensor("op_915"), val = tensor([1, 1])]; tensor obj_43_pad_type_0 = const()[name = tensor("obj_43_pad_type_0"), val = tensor("custom")]; tensor obj_43_pad_0 = const()[name = tensor("obj_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(197404992))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198633856))), name = tensor("layers_3_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_3_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_3_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198634048)))]; tensor obj_43_cast_fp16 = conv(bias = layers_3_self_attn_o_proj_bias_to_fp16, dilations = var_915, groups = var_825, pad = obj_43_pad_0, pad_type = obj_43_pad_type_0, strides = var_913, weight = layers_3_self_attn_o_proj_weight_to_fp16_palettized, x = input_31_cast_fp16)[name = tensor("obj_43_cast_fp16")]; tensor inputs_21_cast_fp16 = add(x = inputs_19_cast_fp16, y = obj_43_cast_fp16)[name = tensor("inputs_21_cast_fp16")]; tensor var_925 = const()[name = tensor("op_925"), val = tensor([1])]; tensor channels_mean_21_cast_fp16 = reduce_mean(axes = var_925, keep_dims = var_826, x = inputs_21_cast_fp16)[name = tensor("channels_mean_21_cast_fp16")]; tensor zero_mean_21_cast_fp16 = sub(x = inputs_21_cast_fp16, y = channels_mean_21_cast_fp16)[name = tensor("zero_mean_21_cast_fp16")]; tensor zero_mean_sq_21_cast_fp16 = mul(x = zero_mean_21_cast_fp16, y = zero_mean_21_cast_fp16)[name = tensor("zero_mean_sq_21_cast_fp16")]; tensor var_929 = const()[name = tensor("op_929"), val = tensor([1])]; tensor var_930_cast_fp16 = reduce_mean(axes = var_929, keep_dims = var_826, x = zero_mean_sq_21_cast_fp16)[name = tensor("op_930_cast_fp16")]; tensor var_931_to_fp16 = const()[name = tensor("op_931_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_932_cast_fp16 = add(x = var_930_cast_fp16, y = var_931_to_fp16)[name = tensor("op_932_cast_fp16")]; tensor denom_21_epsilon_0 = const()[name = tensor("denom_21_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_21_cast_fp16 = rsqrt(epsilon = denom_21_epsilon_0, x = var_932_cast_fp16)[name = tensor("denom_21_cast_fp16")]; tensor out_21_cast_fp16 = mul(x = zero_mean_21_cast_fp16, y = denom_21_cast_fp16)[name = tensor("out_21_cast_fp16")]; tensor obj_45_gamma_0_to_fp16 = const()[name = tensor("obj_45_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198636672)))]; tensor obj_45_beta_0_to_fp16 = const()[name = tensor("obj_45_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198639296)))]; tensor obj_45_epsilon_0_to_fp16 = const()[name = tensor("obj_45_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_45_cast_fp16 = batch_norm(beta = obj_45_beta_0_to_fp16, epsilon = obj_45_epsilon_0_to_fp16, gamma = obj_45_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_21_cast_fp16)[name = tensor("obj_45_cast_fp16")]; tensor var_947 = const()[name = tensor("op_947"), val = tensor([1, 1])]; tensor var_949 = const()[name = tensor("op_949"), val = tensor([1, 1])]; tensor query_15_pad_type_0 = const()[name = tensor("query_15_pad_type_0"), val = tensor("custom")]; tensor query_15_pad_0 = const()[name = tensor("query_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(198641920))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(199461184))), name = tensor("layers_3_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_3_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_3_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(199461312)))]; tensor query_15_cast_fp16 = conv(bias = layers_3_encoder_attn_q_proj_bias_to_fp16, dilations = var_949, groups = var_825, pad = query_15_pad_0, pad_type = query_15_pad_type_0, strides = var_947, weight = layers_3_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_45_cast_fp16)[name = tensor("query_15_cast_fp16")]; tensor var_953 = const()[name = tensor("op_953"), val = tensor([1, 1])]; tensor var_955 = const()[name = tensor("op_955"), val = tensor([1, 1])]; tensor key_15_pad_type_0 = const()[name = tensor("key_15_pad_type_0"), val = tensor("custom")]; tensor key_15_pad_0 = const()[name = tensor("key_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(199463936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(200692800))), name = tensor("layers_3_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_15_cast_fp16 = conv(dilations = var_955, groups = var_825, pad = key_15_pad_0, pad_type = key_15_pad_type_0, strides = var_953, weight = layers_3_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_15_cast_fp16")]; tensor var_960 = const()[name = tensor("op_960"), val = tensor([1, 1])]; tensor var_962 = const()[name = tensor("op_962"), val = tensor([1, 1])]; tensor value_15_pad_type_0 = const()[name = tensor("value_15_pad_type_0"), val = tensor("custom")]; tensor value_15_pad_0 = const()[name = tensor("value_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(200692992))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201512256))), name = tensor("layers_3_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_3_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_3_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201512384)))]; tensor value_15_cast_fp16 = conv(bias = layers_3_encoder_attn_v_proj_bias_to_fp16, dilations = var_962, groups = var_825, pad = value_15_pad_0, pad_type = value_15_pad_type_0, strides = var_960, weight = layers_3_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_15_cast_fp16")]; tensor var_966 = const()[name = tensor("op_966"), val = tensor([1, 20, 64, -1])]; tensor var_967_cast_fp16 = reshape(shape = var_966, x = query_15_cast_fp16)[name = tensor("op_967_cast_fp16")]; tensor var_968_to_fp16 = const()[name = tensor("op_968_to_fp16"), val = tensor(0x1p-3)]; tensor var_969_cast_fp16 = mul(x = var_967_cast_fp16, y = var_968_to_fp16)[name = tensor("op_969_cast_fp16")]; tensor var_970 = const()[name = tensor("op_970"), val = tensor([1, 20, 64, -1])]; tensor var_971_cast_fp16 = reshape(shape = var_970, x = key_15_cast_fp16)[name = tensor("op_971_cast_fp16")]; tensor mh_w_23_transpose_x_0 = const()[name = tensor("mh_w_23_transpose_x_0"), val = tensor(true)]; tensor mh_w_23_transpose_y_0 = const()[name = tensor("mh_w_23_transpose_y_0"), val = tensor(false)]; tensor mh_w_23_cast_fp16 = matmul(transpose_x = mh_w_23_transpose_x_0, transpose_y = mh_w_23_transpose_y_0, x = var_969_cast_fp16, y = var_971_cast_fp16)[name = tensor("mh_w_23_cast_fp16")]; tensor var_974_cast_fp16 = softmax(axis = var_818, x = mh_w_23_cast_fp16)[name = tensor("op_974_cast_fp16")]; tensor var_975 = const()[name = tensor("op_975"), val = tensor([1, 20, 64, -1])]; tensor var_976_cast_fp16 = reshape(shape = var_975, x = value_15_cast_fp16)[name = tensor("op_976_cast_fp16")]; tensor attn_15_transpose_x_0 = const()[name = tensor("attn_15_transpose_x_0"), val = tensor(false)]; tensor attn_15_transpose_y_0 = const()[name = tensor("attn_15_transpose_y_0"), val = tensor(true)]; tensor attn_15_cast_fp16 = matmul(transpose_x = attn_15_transpose_x_0, transpose_y = attn_15_transpose_y_0, x = var_976_cast_fp16, y = var_974_cast_fp16)[name = tensor("attn_15_cast_fp16")]; tensor var_979 = const()[name = tensor("op_979"), val = tensor([1, 1280, 1, -1])]; tensor input_33_cast_fp16 = reshape(shape = var_979, x = attn_15_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor var_983 = const()[name = tensor("op_983"), val = tensor([1, 1])]; tensor var_985 = const()[name = tensor("op_985"), val = tensor([1, 1])]; tensor obj_47_pad_type_0 = const()[name = tensor("obj_47_pad_type_0"), val = tensor("custom")]; tensor obj_47_pad_0 = const()[name = tensor("obj_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201515008))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202743872))), name = tensor("layers_3_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_3_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_3_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202744064)))]; tensor obj_47_cast_fp16 = conv(bias = layers_3_encoder_attn_o_proj_bias_to_fp16, dilations = var_985, groups = var_825, pad = obj_47_pad_0, pad_type = obj_47_pad_type_0, strides = var_983, weight = layers_3_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_33_cast_fp16)[name = tensor("obj_47_cast_fp16")]; tensor inputs_23_cast_fp16 = add(x = inputs_21_cast_fp16, y = obj_47_cast_fp16)[name = tensor("inputs_23_cast_fp16")]; tensor var_991 = const()[name = tensor("op_991"), val = tensor([1])]; tensor channels_mean_23_cast_fp16 = reduce_mean(axes = var_991, keep_dims = var_826, x = inputs_23_cast_fp16)[name = tensor("channels_mean_23_cast_fp16")]; tensor zero_mean_23_cast_fp16 = sub(x = inputs_23_cast_fp16, y = channels_mean_23_cast_fp16)[name = tensor("zero_mean_23_cast_fp16")]; tensor zero_mean_sq_23_cast_fp16 = mul(x = zero_mean_23_cast_fp16, y = zero_mean_23_cast_fp16)[name = tensor("zero_mean_sq_23_cast_fp16")]; tensor var_995 = const()[name = tensor("op_995"), val = tensor([1])]; tensor var_996_cast_fp16 = reduce_mean(axes = var_995, keep_dims = var_826, x = zero_mean_sq_23_cast_fp16)[name = tensor("op_996_cast_fp16")]; tensor var_997_to_fp16 = const()[name = tensor("op_997_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_998_cast_fp16 = add(x = var_996_cast_fp16, y = var_997_to_fp16)[name = tensor("op_998_cast_fp16")]; tensor denom_23_epsilon_0 = const()[name = tensor("denom_23_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_23_cast_fp16 = rsqrt(epsilon = denom_23_epsilon_0, x = var_998_cast_fp16)[name = tensor("denom_23_cast_fp16")]; tensor out_23_cast_fp16 = mul(x = zero_mean_23_cast_fp16, y = denom_23_cast_fp16)[name = tensor("out_23_cast_fp16")]; tensor input_35_gamma_0_to_fp16 = const()[name = tensor("input_35_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202746688)))]; tensor input_35_beta_0_to_fp16 = const()[name = tensor("input_35_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202749312)))]; tensor input_35_epsilon_0_to_fp16 = const()[name = tensor("input_35_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_35_cast_fp16 = batch_norm(beta = input_35_beta_0_to_fp16, epsilon = input_35_epsilon_0_to_fp16, gamma = input_35_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_23_cast_fp16)[name = tensor("input_35_cast_fp16")]; tensor var_1009 = const()[name = tensor("op_1009"), val = tensor([1, 1])]; tensor var_1011 = const()[name = tensor("op_1011"), val = tensor([1, 1])]; tensor input_37_pad_type_0 = const()[name = tensor("input_37_pad_type_0"), val = tensor("custom")]; tensor input_37_pad_0 = const()[name = tensor("input_37_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(202751936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207667200))), name = tensor("layers_3_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_3_fc1_bias_to_fp16 = const()[name = tensor("layers_3_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207667392)))]; tensor input_37_cast_fp16 = conv(bias = layers_3_fc1_bias_to_fp16, dilations = var_1011, groups = var_825, pad = input_37_pad_0, pad_type = input_37_pad_type_0, strides = var_1009, weight = layers_3_fc1_weight_to_fp16_palettized, x = input_35_cast_fp16)[name = tensor("input_37_cast_fp16")]; tensor input_39_mode_0 = const()[name = tensor("input_39_mode_0"), val = tensor("EXACT")]; tensor input_39_cast_fp16 = gelu(mode = input_39_mode_0, x = input_37_cast_fp16)[name = tensor("input_39_cast_fp16")]; tensor var_1017 = const()[name = tensor("op_1017"), val = tensor([1, 1])]; tensor var_1019 = const()[name = tensor("op_1019"), val = tensor([1, 1])]; tensor hidden_states_9_pad_type_0 = const()[name = tensor("hidden_states_9_pad_type_0"), val = tensor("custom")]; tensor hidden_states_9_pad_0 = const()[name = tensor("hidden_states_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_3_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(207677696))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214231360))), name = tensor("layers_3_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_3_fc2_bias_to_fp16 = const()[name = tensor("layers_3_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214231936)))]; tensor hidden_states_9_cast_fp16 = conv(bias = layers_3_fc2_bias_to_fp16, dilations = var_1019, groups = var_825, pad = hidden_states_9_pad_0, pad_type = hidden_states_9_pad_type_0, strides = var_1017, weight = layers_3_fc2_weight_to_fp16_palettized, x = input_39_cast_fp16)[name = tensor("hidden_states_9_cast_fp16")]; tensor inputs_25_cast_fp16 = add(x = inputs_23_cast_fp16, y = hidden_states_9_cast_fp16)[name = tensor("inputs_25_cast_fp16")]; tensor var_1032 = const()[name = tensor("op_1032"), val = tensor(3)]; tensor var_1039 = const()[name = tensor("op_1039"), val = tensor(1)]; tensor var_1040 = const()[name = tensor("op_1040"), val = tensor(true)]; tensor var_1052 = const()[name = tensor("op_1052"), val = tensor([1])]; tensor channels_mean_25_cast_fp16 = reduce_mean(axes = var_1052, keep_dims = var_1040, x = inputs_25_cast_fp16)[name = tensor("channels_mean_25_cast_fp16")]; tensor zero_mean_25_cast_fp16 = sub(x = inputs_25_cast_fp16, y = channels_mean_25_cast_fp16)[name = tensor("zero_mean_25_cast_fp16")]; tensor zero_mean_sq_25_cast_fp16 = mul(x = zero_mean_25_cast_fp16, y = zero_mean_25_cast_fp16)[name = tensor("zero_mean_sq_25_cast_fp16")]; tensor var_1056 = const()[name = tensor("op_1056"), val = tensor([1])]; tensor var_1057_cast_fp16 = reduce_mean(axes = var_1056, keep_dims = var_1040, x = zero_mean_sq_25_cast_fp16)[name = tensor("op_1057_cast_fp16")]; tensor var_1058_to_fp16 = const()[name = tensor("op_1058_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1059_cast_fp16 = add(x = var_1057_cast_fp16, y = var_1058_to_fp16)[name = tensor("op_1059_cast_fp16")]; tensor denom_25_epsilon_0 = const()[name = tensor("denom_25_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_25_cast_fp16 = rsqrt(epsilon = denom_25_epsilon_0, x = var_1059_cast_fp16)[name = tensor("denom_25_cast_fp16")]; tensor out_25_cast_fp16 = mul(x = zero_mean_25_cast_fp16, y = denom_25_cast_fp16)[name = tensor("out_25_cast_fp16")]; tensor obj_49_gamma_0_to_fp16 = const()[name = tensor("obj_49_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214234560)))]; tensor obj_49_beta_0_to_fp16 = const()[name = tensor("obj_49_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214237184)))]; tensor obj_49_epsilon_0_to_fp16 = const()[name = tensor("obj_49_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_49_cast_fp16 = batch_norm(beta = obj_49_beta_0_to_fp16, epsilon = obj_49_epsilon_0_to_fp16, gamma = obj_49_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_25_cast_fp16)[name = tensor("obj_49_cast_fp16")]; tensor var_1074 = const()[name = tensor("op_1074"), val = tensor([1, 1])]; tensor var_1076 = const()[name = tensor("op_1076"), val = tensor([1, 1])]; tensor query_17_pad_type_0 = const()[name = tensor("query_17_pad_type_0"), val = tensor("custom")]; tensor query_17_pad_0 = const()[name = tensor("query_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214239808))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215468672))), name = tensor("layers_4_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_4_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_4_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215468864)))]; tensor query_17_cast_fp16 = conv(bias = layers_4_self_attn_q_proj_bias_to_fp16, dilations = var_1076, groups = var_1039, pad = query_17_pad_0, pad_type = query_17_pad_type_0, strides = var_1074, weight = layers_4_self_attn_q_proj_weight_to_fp16_palettized, x = obj_49_cast_fp16)[name = tensor("query_17_cast_fp16")]; tensor var_1080 = const()[name = tensor("op_1080"), val = tensor([1, 1])]; tensor var_1082 = const()[name = tensor("op_1082"), val = tensor([1, 1])]; tensor current_key_9_pad_type_0 = const()[name = tensor("current_key_9_pad_type_0"), val = tensor("custom")]; tensor current_key_9_pad_0 = const()[name = tensor("current_key_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215471488))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(216290752))), name = tensor("layers_4_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_9_cast_fp16 = conv(dilations = var_1082, groups = var_1039, pad = current_key_9_pad_0, pad_type = current_key_9_pad_type_0, strides = var_1080, weight = layers_4_self_attn_k_proj_weight_to_fp16_palettized, x = obj_49_cast_fp16)[name = tensor("current_key_9_cast_fp16")]; tensor var_1087 = const()[name = tensor("op_1087"), val = tensor([1, 1])]; tensor var_1089 = const()[name = tensor("op_1089"), val = tensor([1, 1])]; tensor current_value_9_pad_type_0 = const()[name = tensor("current_value_9_pad_type_0"), val = tensor("custom")]; tensor current_value_9_pad_0 = const()[name = tensor("current_value_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(216290880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217519744))), name = tensor("layers_4_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_4_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_4_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217519936)))]; tensor current_value_9_cast_fp16 = conv(bias = layers_4_self_attn_v_proj_bias_to_fp16, dilations = var_1089, groups = var_1039, pad = current_value_9_pad_0, pad_type = current_value_9_pad_type_0, strides = var_1087, weight = layers_4_self_attn_v_proj_weight_to_fp16_palettized, x = obj_49_cast_fp16)[name = tensor("current_value_9_cast_fp16")]; tensor var_1096_cast_fp16 = mul(x = current_key_9_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1096_cast_fp16")]; tensor var_1098_cast_fp16 = mul(x = var_103_cast_fp16_4, y = var_241_cast_fp16)[name = tensor("op_1098_cast_fp16")]; tensor key_17_cast_fp16 = add(x = var_1096_cast_fp16, y = var_1098_cast_fp16)[name = tensor("key_17_cast_fp16")]; tensor var_1100_cast_fp16 = mul(x = current_value_9_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1100_cast_fp16")]; tensor var_1102_cast_fp16 = mul(x = var_138_cast_fp16_4, y = var_241_cast_fp16)[name = tensor("op_1102_cast_fp16")]; tensor value_17_cast_fp16 = add(x = var_1100_cast_fp16, y = var_1102_cast_fp16)[name = tensor("value_17_cast_fp16")]; tensor var_1105 = const()[name = tensor("op_1105"), val = tensor([1, 20, 64, -1])]; tensor var_1106_cast_fp16 = reshape(shape = var_1105, x = query_17_cast_fp16)[name = tensor("op_1106_cast_fp16")]; tensor var_1107_to_fp16 = const()[name = tensor("op_1107_to_fp16"), val = tensor(0x1p-3)]; tensor var_1108_cast_fp16 = mul(x = var_1106_cast_fp16, y = var_1107_to_fp16)[name = tensor("op_1108_cast_fp16")]; tensor var_1109 = const()[name = tensor("op_1109"), val = tensor([1, 20, 64, -1])]; tensor var_1110_cast_fp16 = reshape(shape = var_1109, x = key_17_cast_fp16)[name = tensor("op_1110_cast_fp16")]; tensor mh_w_25_transpose_x_0 = const()[name = tensor("mh_w_25_transpose_x_0"), val = tensor(true)]; tensor mh_w_25_transpose_y_0 = const()[name = tensor("mh_w_25_transpose_y_0"), val = tensor(false)]; tensor mh_w_25_cast_fp16 = matmul(transpose_x = mh_w_25_transpose_x_0, transpose_y = mh_w_25_transpose_y_0, x = var_1108_cast_fp16, y = var_1110_cast_fp16)[name = tensor("mh_w_25_cast_fp16")]; tensor mh_w_27_cast_fp16 = add(x = mh_w_25_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_27_cast_fp16")]; tensor var_1118_cast_fp16 = softmax(axis = var_1032, x = mh_w_27_cast_fp16)[name = tensor("op_1118_cast_fp16")]; tensor var_1119 = const()[name = tensor("op_1119"), val = tensor([1, 20, 64, -1])]; tensor var_1120_cast_fp16 = reshape(shape = var_1119, x = value_17_cast_fp16)[name = tensor("op_1120_cast_fp16")]; tensor attn_17_transpose_x_0 = const()[name = tensor("attn_17_transpose_x_0"), val = tensor(false)]; tensor attn_17_transpose_y_0 = const()[name = tensor("attn_17_transpose_y_0"), val = tensor(true)]; tensor attn_17_cast_fp16 = matmul(transpose_x = attn_17_transpose_x_0, transpose_y = attn_17_transpose_y_0, x = var_1120_cast_fp16, y = var_1118_cast_fp16)[name = tensor("attn_17_cast_fp16")]; tensor var_1123 = const()[name = tensor("op_1123"), val = tensor([1, 1280, 1, -1])]; tensor input_41_cast_fp16 = reshape(shape = var_1123, x = attn_17_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor var_1127 = const()[name = tensor("op_1127"), val = tensor([1, 1])]; tensor var_1129 = const()[name = tensor("op_1129"), val = tensor([1, 1])]; tensor obj_55_pad_type_0 = const()[name = tensor("obj_55_pad_type_0"), val = tensor("custom")]; tensor obj_55_pad_0 = const()[name = tensor("obj_55_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217522560))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218751424))), name = tensor("layers_4_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_4_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_4_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218751616)))]; tensor obj_55_cast_fp16 = conv(bias = layers_4_self_attn_o_proj_bias_to_fp16, dilations = var_1129, groups = var_1039, pad = obj_55_pad_0, pad_type = obj_55_pad_type_0, strides = var_1127, weight = layers_4_self_attn_o_proj_weight_to_fp16_palettized, x = input_41_cast_fp16)[name = tensor("obj_55_cast_fp16")]; tensor inputs_27_cast_fp16 = add(x = inputs_25_cast_fp16, y = obj_55_cast_fp16)[name = tensor("inputs_27_cast_fp16")]; tensor var_1139 = const()[name = tensor("op_1139"), val = tensor([1])]; tensor channels_mean_27_cast_fp16 = reduce_mean(axes = var_1139, keep_dims = var_1040, x = inputs_27_cast_fp16)[name = tensor("channels_mean_27_cast_fp16")]; tensor zero_mean_27_cast_fp16 = sub(x = inputs_27_cast_fp16, y = channels_mean_27_cast_fp16)[name = tensor("zero_mean_27_cast_fp16")]; tensor zero_mean_sq_27_cast_fp16 = mul(x = zero_mean_27_cast_fp16, y = zero_mean_27_cast_fp16)[name = tensor("zero_mean_sq_27_cast_fp16")]; tensor var_1143 = const()[name = tensor("op_1143"), val = tensor([1])]; tensor var_1144_cast_fp16 = reduce_mean(axes = var_1143, keep_dims = var_1040, x = zero_mean_sq_27_cast_fp16)[name = tensor("op_1144_cast_fp16")]; tensor var_1145_to_fp16 = const()[name = tensor("op_1145_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1146_cast_fp16 = add(x = var_1144_cast_fp16, y = var_1145_to_fp16)[name = tensor("op_1146_cast_fp16")]; tensor denom_27_epsilon_0 = const()[name = tensor("denom_27_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_27_cast_fp16 = rsqrt(epsilon = denom_27_epsilon_0, x = var_1146_cast_fp16)[name = tensor("denom_27_cast_fp16")]; tensor out_27_cast_fp16 = mul(x = zero_mean_27_cast_fp16, y = denom_27_cast_fp16)[name = tensor("out_27_cast_fp16")]; tensor obj_57_gamma_0_to_fp16 = const()[name = tensor("obj_57_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218754240)))]; tensor obj_57_beta_0_to_fp16 = const()[name = tensor("obj_57_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218756864)))]; tensor obj_57_epsilon_0_to_fp16 = const()[name = tensor("obj_57_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_57_cast_fp16 = batch_norm(beta = obj_57_beta_0_to_fp16, epsilon = obj_57_epsilon_0_to_fp16, gamma = obj_57_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_27_cast_fp16)[name = tensor("obj_57_cast_fp16")]; tensor var_1161 = const()[name = tensor("op_1161"), val = tensor([1, 1])]; tensor var_1163 = const()[name = tensor("op_1163"), val = tensor([1, 1])]; tensor query_19_pad_type_0 = const()[name = tensor("query_19_pad_type_0"), val = tensor("custom")]; tensor query_19_pad_0 = const()[name = tensor("query_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218759488))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219578752))), name = tensor("layers_4_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_4_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_4_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219578880)))]; tensor query_19_cast_fp16 = conv(bias = layers_4_encoder_attn_q_proj_bias_to_fp16, dilations = var_1163, groups = var_1039, pad = query_19_pad_0, pad_type = query_19_pad_type_0, strides = var_1161, weight = layers_4_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_57_cast_fp16)[name = tensor("query_19_cast_fp16")]; tensor var_1167 = const()[name = tensor("op_1167"), val = tensor([1, 1])]; tensor var_1169 = const()[name = tensor("op_1169"), val = tensor([1, 1])]; tensor key_19_pad_type_0 = const()[name = tensor("key_19_pad_type_0"), val = tensor("custom")]; tensor key_19_pad_0 = const()[name = tensor("key_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219581504))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220810368))), name = tensor("layers_4_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_19_cast_fp16 = conv(dilations = var_1169, groups = var_1039, pad = key_19_pad_0, pad_type = key_19_pad_type_0, strides = var_1167, weight = layers_4_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_19_cast_fp16")]; tensor var_1174 = const()[name = tensor("op_1174"), val = tensor([1, 1])]; tensor var_1176 = const()[name = tensor("op_1176"), val = tensor([1, 1])]; tensor value_19_pad_type_0 = const()[name = tensor("value_19_pad_type_0"), val = tensor("custom")]; tensor value_19_pad_0 = const()[name = tensor("value_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220810560))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(222039424))), name = tensor("layers_4_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_4_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_4_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(222039616)))]; tensor value_19_cast_fp16 = conv(bias = layers_4_encoder_attn_v_proj_bias_to_fp16, dilations = var_1176, groups = var_1039, pad = value_19_pad_0, pad_type = value_19_pad_type_0, strides = var_1174, weight = layers_4_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_19_cast_fp16")]; tensor var_1180 = const()[name = tensor("op_1180"), val = tensor([1, 20, 64, -1])]; tensor var_1181_cast_fp16 = reshape(shape = var_1180, x = query_19_cast_fp16)[name = tensor("op_1181_cast_fp16")]; tensor var_1182_to_fp16 = const()[name = tensor("op_1182_to_fp16"), val = tensor(0x1p-3)]; tensor var_1183_cast_fp16 = mul(x = var_1181_cast_fp16, y = var_1182_to_fp16)[name = tensor("op_1183_cast_fp16")]; tensor var_1184 = const()[name = tensor("op_1184"), val = tensor([1, 20, 64, -1])]; tensor var_1185_cast_fp16 = reshape(shape = var_1184, x = key_19_cast_fp16)[name = tensor("op_1185_cast_fp16")]; tensor mh_w_29_transpose_x_0 = const()[name = tensor("mh_w_29_transpose_x_0"), val = tensor(true)]; tensor mh_w_29_transpose_y_0 = const()[name = tensor("mh_w_29_transpose_y_0"), val = tensor(false)]; tensor mh_w_29_cast_fp16 = matmul(transpose_x = mh_w_29_transpose_x_0, transpose_y = mh_w_29_transpose_y_0, x = var_1183_cast_fp16, y = var_1185_cast_fp16)[name = tensor("mh_w_29_cast_fp16")]; tensor var_1188_cast_fp16 = softmax(axis = var_1032, x = mh_w_29_cast_fp16)[name = tensor("op_1188_cast_fp16")]; tensor var_1189 = const()[name = tensor("op_1189"), val = tensor([1, 20, 64, -1])]; tensor var_1190_cast_fp16 = reshape(shape = var_1189, x = value_19_cast_fp16)[name = tensor("op_1190_cast_fp16")]; tensor attn_19_transpose_x_0 = const()[name = tensor("attn_19_transpose_x_0"), val = tensor(false)]; tensor attn_19_transpose_y_0 = const()[name = tensor("attn_19_transpose_y_0"), val = tensor(true)]; tensor attn_19_cast_fp16 = matmul(transpose_x = attn_19_transpose_x_0, transpose_y = attn_19_transpose_y_0, x = var_1190_cast_fp16, y = var_1188_cast_fp16)[name = tensor("attn_19_cast_fp16")]; tensor var_1193 = const()[name = tensor("op_1193"), val = tensor([1, 1280, 1, -1])]; tensor input_43_cast_fp16 = reshape(shape = var_1193, x = attn_19_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor var_1197 = const()[name = tensor("op_1197"), val = tensor([1, 1])]; tensor var_1199 = const()[name = tensor("op_1199"), val = tensor([1, 1])]; tensor obj_59_pad_type_0 = const()[name = tensor("obj_59_pad_type_0"), val = tensor("custom")]; tensor obj_59_pad_0 = const()[name = tensor("obj_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(222042240))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(223271104))), name = tensor("layers_4_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_4_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_4_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(223271296)))]; tensor obj_59_cast_fp16 = conv(bias = layers_4_encoder_attn_o_proj_bias_to_fp16, dilations = var_1199, groups = var_1039, pad = obj_59_pad_0, pad_type = obj_59_pad_type_0, strides = var_1197, weight = layers_4_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_43_cast_fp16)[name = tensor("obj_59_cast_fp16")]; tensor inputs_29_cast_fp16 = add(x = inputs_27_cast_fp16, y = obj_59_cast_fp16)[name = tensor("inputs_29_cast_fp16")]; tensor var_1205 = const()[name = tensor("op_1205"), val = tensor([1])]; tensor channels_mean_29_cast_fp16 = reduce_mean(axes = var_1205, keep_dims = var_1040, x = inputs_29_cast_fp16)[name = tensor("channels_mean_29_cast_fp16")]; tensor zero_mean_29_cast_fp16 = sub(x = inputs_29_cast_fp16, y = channels_mean_29_cast_fp16)[name = tensor("zero_mean_29_cast_fp16")]; tensor zero_mean_sq_29_cast_fp16 = mul(x = zero_mean_29_cast_fp16, y = zero_mean_29_cast_fp16)[name = tensor("zero_mean_sq_29_cast_fp16")]; tensor var_1209 = const()[name = tensor("op_1209"), val = tensor([1])]; tensor var_1210_cast_fp16 = reduce_mean(axes = var_1209, keep_dims = var_1040, x = zero_mean_sq_29_cast_fp16)[name = tensor("op_1210_cast_fp16")]; tensor var_1211_to_fp16 = const()[name = tensor("op_1211_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1212_cast_fp16 = add(x = var_1210_cast_fp16, y = var_1211_to_fp16)[name = tensor("op_1212_cast_fp16")]; tensor denom_29_epsilon_0 = const()[name = tensor("denom_29_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_29_cast_fp16 = rsqrt(epsilon = denom_29_epsilon_0, x = var_1212_cast_fp16)[name = tensor("denom_29_cast_fp16")]; tensor out_29_cast_fp16 = mul(x = zero_mean_29_cast_fp16, y = denom_29_cast_fp16)[name = tensor("out_29_cast_fp16")]; tensor input_45_gamma_0_to_fp16 = const()[name = tensor("input_45_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(223273920)))]; tensor input_45_beta_0_to_fp16 = const()[name = tensor("input_45_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(223276544)))]; tensor input_45_epsilon_0_to_fp16 = const()[name = tensor("input_45_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_45_cast_fp16 = batch_norm(beta = input_45_beta_0_to_fp16, epsilon = input_45_epsilon_0_to_fp16, gamma = input_45_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_29_cast_fp16)[name = tensor("input_45_cast_fp16")]; tensor var_1223 = const()[name = tensor("op_1223"), val = tensor([1, 1])]; tensor var_1225 = const()[name = tensor("op_1225"), val = tensor([1, 1])]; tensor input_47_pad_type_0 = const()[name = tensor("input_47_pad_type_0"), val = tensor("custom")]; tensor input_47_pad_0 = const()[name = tensor("input_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(223279168))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(228194432))), name = tensor("layers_4_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_4_fc1_bias_to_fp16 = const()[name = tensor("layers_4_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(228194624)))]; tensor input_47_cast_fp16 = conv(bias = layers_4_fc1_bias_to_fp16, dilations = var_1225, groups = var_1039, pad = input_47_pad_0, pad_type = input_47_pad_type_0, strides = var_1223, weight = layers_4_fc1_weight_to_fp16_palettized, x = input_45_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor input_49_mode_0 = const()[name = tensor("input_49_mode_0"), val = tensor("EXACT")]; tensor input_49_cast_fp16 = gelu(mode = input_49_mode_0, x = input_47_cast_fp16)[name = tensor("input_49_cast_fp16")]; tensor var_1231 = const()[name = tensor("op_1231"), val = tensor([1, 1])]; tensor var_1233 = const()[name = tensor("op_1233"), val = tensor([1, 1])]; tensor hidden_states_11_pad_type_0 = const()[name = tensor("hidden_states_11_pad_type_0"), val = tensor("custom")]; tensor hidden_states_11_pad_0 = const()[name = tensor("hidden_states_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_4_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(228204928))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233120192))), name = tensor("layers_4_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_4_fc2_bias_to_fp16 = const()[name = tensor("layers_4_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233120384)))]; tensor hidden_states_11_cast_fp16 = conv(bias = layers_4_fc2_bias_to_fp16, dilations = var_1233, groups = var_1039, pad = hidden_states_11_pad_0, pad_type = hidden_states_11_pad_type_0, strides = var_1231, weight = layers_4_fc2_weight_to_fp16_palettized, x = input_49_cast_fp16)[name = tensor("hidden_states_11_cast_fp16")]; tensor inputs_31_cast_fp16 = add(x = inputs_29_cast_fp16, y = hidden_states_11_cast_fp16)[name = tensor("inputs_31_cast_fp16")]; tensor var_1246 = const()[name = tensor("op_1246"), val = tensor(3)]; tensor var_1253 = const()[name = tensor("op_1253"), val = tensor(1)]; tensor var_1254 = const()[name = tensor("op_1254"), val = tensor(true)]; tensor var_1266 = const()[name = tensor("op_1266"), val = tensor([1])]; tensor channels_mean_31_cast_fp16 = reduce_mean(axes = var_1266, keep_dims = var_1254, x = inputs_31_cast_fp16)[name = tensor("channels_mean_31_cast_fp16")]; tensor zero_mean_31_cast_fp16 = sub(x = inputs_31_cast_fp16, y = channels_mean_31_cast_fp16)[name = tensor("zero_mean_31_cast_fp16")]; tensor zero_mean_sq_31_cast_fp16 = mul(x = zero_mean_31_cast_fp16, y = zero_mean_31_cast_fp16)[name = tensor("zero_mean_sq_31_cast_fp16")]; tensor var_1270 = const()[name = tensor("op_1270"), val = tensor([1])]; tensor var_1271_cast_fp16 = reduce_mean(axes = var_1270, keep_dims = var_1254, x = zero_mean_sq_31_cast_fp16)[name = tensor("op_1271_cast_fp16")]; tensor var_1272_to_fp16 = const()[name = tensor("op_1272_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1273_cast_fp16 = add(x = var_1271_cast_fp16, y = var_1272_to_fp16)[name = tensor("op_1273_cast_fp16")]; tensor denom_31_epsilon_0 = const()[name = tensor("denom_31_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_31_cast_fp16 = rsqrt(epsilon = denom_31_epsilon_0, x = var_1273_cast_fp16)[name = tensor("denom_31_cast_fp16")]; tensor out_31_cast_fp16 = mul(x = zero_mean_31_cast_fp16, y = denom_31_cast_fp16)[name = tensor("out_31_cast_fp16")]; tensor obj_61_gamma_0_to_fp16 = const()[name = tensor("obj_61_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233123008)))]; tensor obj_61_beta_0_to_fp16 = const()[name = tensor("obj_61_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233125632)))]; tensor obj_61_epsilon_0_to_fp16 = const()[name = tensor("obj_61_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_61_cast_fp16 = batch_norm(beta = obj_61_beta_0_to_fp16, epsilon = obj_61_epsilon_0_to_fp16, gamma = obj_61_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_31_cast_fp16)[name = tensor("obj_61_cast_fp16")]; tensor var_1288 = const()[name = tensor("op_1288"), val = tensor([1, 1])]; tensor var_1290 = const()[name = tensor("op_1290"), val = tensor([1, 1])]; tensor query_21_pad_type_0 = const()[name = tensor("query_21_pad_type_0"), val = tensor("custom")]; tensor query_21_pad_0 = const()[name = tensor("query_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(233128256))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(234357120))), name = tensor("layers_5_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_5_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_5_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(234357312)))]; tensor query_21_cast_fp16 = conv(bias = layers_5_self_attn_q_proj_bias_to_fp16, dilations = var_1290, groups = var_1253, pad = query_21_pad_0, pad_type = query_21_pad_type_0, strides = var_1288, weight = layers_5_self_attn_q_proj_weight_to_fp16_palettized, x = obj_61_cast_fp16)[name = tensor("query_21_cast_fp16")]; tensor var_1294 = const()[name = tensor("op_1294"), val = tensor([1, 1])]; tensor var_1296 = const()[name = tensor("op_1296"), val = tensor([1, 1])]; tensor current_key_11_pad_type_0 = const()[name = tensor("current_key_11_pad_type_0"), val = tensor("custom")]; tensor current_key_11_pad_0 = const()[name = tensor("current_key_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(234359936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(235588800))), name = tensor("layers_5_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_11_cast_fp16 = conv(dilations = var_1296, groups = var_1253, pad = current_key_11_pad_0, pad_type = current_key_11_pad_type_0, strides = var_1294, weight = layers_5_self_attn_k_proj_weight_to_fp16_palettized, x = obj_61_cast_fp16)[name = tensor("current_key_11_cast_fp16")]; tensor var_1301 = const()[name = tensor("op_1301"), val = tensor([1, 1])]; tensor var_1303 = const()[name = tensor("op_1303"), val = tensor([1, 1])]; tensor current_value_11_pad_type_0 = const()[name = tensor("current_value_11_pad_type_0"), val = tensor("custom")]; tensor current_value_11_pad_0 = const()[name = tensor("current_value_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(235588992))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236408256))), name = tensor("layers_5_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_5_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_5_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236408384)))]; tensor current_value_11_cast_fp16 = conv(bias = layers_5_self_attn_v_proj_bias_to_fp16, dilations = var_1303, groups = var_1253, pad = current_value_11_pad_0, pad_type = current_value_11_pad_type_0, strides = var_1301, weight = layers_5_self_attn_v_proj_weight_to_fp16_palettized, x = obj_61_cast_fp16)[name = tensor("current_value_11_cast_fp16")]; tensor var_1310_cast_fp16 = mul(x = current_key_11_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1310_cast_fp16")]; tensor var_1312_cast_fp16 = mul(x = var_103_cast_fp16_5, y = var_241_cast_fp16)[name = tensor("op_1312_cast_fp16")]; tensor key_21_cast_fp16 = add(x = var_1310_cast_fp16, y = var_1312_cast_fp16)[name = tensor("key_21_cast_fp16")]; tensor var_1314_cast_fp16 = mul(x = current_value_11_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1314_cast_fp16")]; tensor var_1316_cast_fp16 = mul(x = var_138_cast_fp16_5, y = var_241_cast_fp16)[name = tensor("op_1316_cast_fp16")]; tensor value_21_cast_fp16 = add(x = var_1314_cast_fp16, y = var_1316_cast_fp16)[name = tensor("value_21_cast_fp16")]; tensor var_1319 = const()[name = tensor("op_1319"), val = tensor([1, 20, 64, -1])]; tensor var_1320_cast_fp16 = reshape(shape = var_1319, x = query_21_cast_fp16)[name = tensor("op_1320_cast_fp16")]; tensor var_1321_to_fp16 = const()[name = tensor("op_1321_to_fp16"), val = tensor(0x1p-3)]; tensor var_1322_cast_fp16 = mul(x = var_1320_cast_fp16, y = var_1321_to_fp16)[name = tensor("op_1322_cast_fp16")]; tensor var_1323 = const()[name = tensor("op_1323"), val = tensor([1, 20, 64, -1])]; tensor var_1324_cast_fp16 = reshape(shape = var_1323, x = key_21_cast_fp16)[name = tensor("op_1324_cast_fp16")]; tensor mh_w_31_transpose_x_0 = const()[name = tensor("mh_w_31_transpose_x_0"), val = tensor(true)]; tensor mh_w_31_transpose_y_0 = const()[name = tensor("mh_w_31_transpose_y_0"), val = tensor(false)]; tensor mh_w_31_cast_fp16 = matmul(transpose_x = mh_w_31_transpose_x_0, transpose_y = mh_w_31_transpose_y_0, x = var_1322_cast_fp16, y = var_1324_cast_fp16)[name = tensor("mh_w_31_cast_fp16")]; tensor mh_w_33_cast_fp16 = add(x = mh_w_31_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_33_cast_fp16")]; tensor var_1332_cast_fp16 = softmax(axis = var_1246, x = mh_w_33_cast_fp16)[name = tensor("op_1332_cast_fp16")]; tensor var_1333 = const()[name = tensor("op_1333"), val = tensor([1, 20, 64, -1])]; tensor var_1334_cast_fp16 = reshape(shape = var_1333, x = value_21_cast_fp16)[name = tensor("op_1334_cast_fp16")]; tensor attn_21_transpose_x_0 = const()[name = tensor("attn_21_transpose_x_0"), val = tensor(false)]; tensor attn_21_transpose_y_0 = const()[name = tensor("attn_21_transpose_y_0"), val = tensor(true)]; tensor attn_21_cast_fp16 = matmul(transpose_x = attn_21_transpose_x_0, transpose_y = attn_21_transpose_y_0, x = var_1334_cast_fp16, y = var_1332_cast_fp16)[name = tensor("attn_21_cast_fp16")]; tensor var_1337 = const()[name = tensor("op_1337"), val = tensor([1, 1280, 1, -1])]; tensor input_51_cast_fp16 = reshape(shape = var_1337, x = attn_21_cast_fp16)[name = tensor("input_51_cast_fp16")]; tensor var_1341 = const()[name = tensor("op_1341"), val = tensor([1, 1])]; tensor var_1343 = const()[name = tensor("op_1343"), val = tensor([1, 1])]; tensor obj_67_pad_type_0 = const()[name = tensor("obj_67_pad_type_0"), val = tensor("custom")]; tensor obj_67_pad_0 = const()[name = tensor("obj_67_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236411008))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237639872))), name = tensor("layers_5_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_5_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_5_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237640064)))]; tensor obj_67_cast_fp16 = conv(bias = layers_5_self_attn_o_proj_bias_to_fp16, dilations = var_1343, groups = var_1253, pad = obj_67_pad_0, pad_type = obj_67_pad_type_0, strides = var_1341, weight = layers_5_self_attn_o_proj_weight_to_fp16_palettized, x = input_51_cast_fp16)[name = tensor("obj_67_cast_fp16")]; tensor inputs_33_cast_fp16 = add(x = inputs_31_cast_fp16, y = obj_67_cast_fp16)[name = tensor("inputs_33_cast_fp16")]; tensor var_1353 = const()[name = tensor("op_1353"), val = tensor([1])]; tensor channels_mean_33_cast_fp16 = reduce_mean(axes = var_1353, keep_dims = var_1254, x = inputs_33_cast_fp16)[name = tensor("channels_mean_33_cast_fp16")]; tensor zero_mean_33_cast_fp16 = sub(x = inputs_33_cast_fp16, y = channels_mean_33_cast_fp16)[name = tensor("zero_mean_33_cast_fp16")]; tensor zero_mean_sq_33_cast_fp16 = mul(x = zero_mean_33_cast_fp16, y = zero_mean_33_cast_fp16)[name = tensor("zero_mean_sq_33_cast_fp16")]; tensor var_1357 = const()[name = tensor("op_1357"), val = tensor([1])]; tensor var_1358_cast_fp16 = reduce_mean(axes = var_1357, keep_dims = var_1254, x = zero_mean_sq_33_cast_fp16)[name = tensor("op_1358_cast_fp16")]; tensor var_1359_to_fp16 = const()[name = tensor("op_1359_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1360_cast_fp16 = add(x = var_1358_cast_fp16, y = var_1359_to_fp16)[name = tensor("op_1360_cast_fp16")]; tensor denom_33_epsilon_0 = const()[name = tensor("denom_33_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_33_cast_fp16 = rsqrt(epsilon = denom_33_epsilon_0, x = var_1360_cast_fp16)[name = tensor("denom_33_cast_fp16")]; tensor out_33_cast_fp16 = mul(x = zero_mean_33_cast_fp16, y = denom_33_cast_fp16)[name = tensor("out_33_cast_fp16")]; tensor obj_69_gamma_0_to_fp16 = const()[name = tensor("obj_69_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237642688)))]; tensor obj_69_beta_0_to_fp16 = const()[name = tensor("obj_69_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237645312)))]; tensor obj_69_epsilon_0_to_fp16 = const()[name = tensor("obj_69_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_69_cast_fp16 = batch_norm(beta = obj_69_beta_0_to_fp16, epsilon = obj_69_epsilon_0_to_fp16, gamma = obj_69_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_33_cast_fp16)[name = tensor("obj_69_cast_fp16")]; tensor var_1375 = const()[name = tensor("op_1375"), val = tensor([1, 1])]; tensor var_1377 = const()[name = tensor("op_1377"), val = tensor([1, 1])]; tensor query_23_pad_type_0 = const()[name = tensor("query_23_pad_type_0"), val = tensor("custom")]; tensor query_23_pad_0 = const()[name = tensor("query_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(237647936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(238467200))), name = tensor("layers_5_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_5_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_5_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(238467328)))]; tensor query_23_cast_fp16 = conv(bias = layers_5_encoder_attn_q_proj_bias_to_fp16, dilations = var_1377, groups = var_1253, pad = query_23_pad_0, pad_type = query_23_pad_type_0, strides = var_1375, weight = layers_5_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_69_cast_fp16)[name = tensor("query_23_cast_fp16")]; tensor var_1381 = const()[name = tensor("op_1381"), val = tensor([1, 1])]; tensor var_1383 = const()[name = tensor("op_1383"), val = tensor([1, 1])]; tensor key_23_pad_type_0 = const()[name = tensor("key_23_pad_type_0"), val = tensor("custom")]; tensor key_23_pad_0 = const()[name = tensor("key_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(238469952))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(239289216))), name = tensor("layers_5_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_23_cast_fp16 = conv(dilations = var_1383, groups = var_1253, pad = key_23_pad_0, pad_type = key_23_pad_type_0, strides = var_1381, weight = layers_5_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_23_cast_fp16")]; tensor var_1388 = const()[name = tensor("op_1388"), val = tensor([1, 1])]; tensor var_1390 = const()[name = tensor("op_1390"), val = tensor([1, 1])]; tensor value_23_pad_type_0 = const()[name = tensor("value_23_pad_type_0"), val = tensor("custom")]; tensor value_23_pad_0 = const()[name = tensor("value_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(239289344))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240108608))), name = tensor("layers_5_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_5_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_5_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240108736)))]; tensor value_23_cast_fp16 = conv(bias = layers_5_encoder_attn_v_proj_bias_to_fp16, dilations = var_1390, groups = var_1253, pad = value_23_pad_0, pad_type = value_23_pad_type_0, strides = var_1388, weight = layers_5_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_23_cast_fp16")]; tensor var_1394 = const()[name = tensor("op_1394"), val = tensor([1, 20, 64, -1])]; tensor var_1395_cast_fp16 = reshape(shape = var_1394, x = query_23_cast_fp16)[name = tensor("op_1395_cast_fp16")]; tensor var_1396_to_fp16 = const()[name = tensor("op_1396_to_fp16"), val = tensor(0x1p-3)]; tensor var_1397_cast_fp16 = mul(x = var_1395_cast_fp16, y = var_1396_to_fp16)[name = tensor("op_1397_cast_fp16")]; tensor var_1398 = const()[name = tensor("op_1398"), val = tensor([1, 20, 64, -1])]; tensor var_1399_cast_fp16 = reshape(shape = var_1398, x = key_23_cast_fp16)[name = tensor("op_1399_cast_fp16")]; tensor mh_w_35_transpose_x_0 = const()[name = tensor("mh_w_35_transpose_x_0"), val = tensor(true)]; tensor mh_w_35_transpose_y_0 = const()[name = tensor("mh_w_35_transpose_y_0"), val = tensor(false)]; tensor mh_w_35_cast_fp16 = matmul(transpose_x = mh_w_35_transpose_x_0, transpose_y = mh_w_35_transpose_y_0, x = var_1397_cast_fp16, y = var_1399_cast_fp16)[name = tensor("mh_w_35_cast_fp16")]; tensor var_1402_cast_fp16 = softmax(axis = var_1246, x = mh_w_35_cast_fp16)[name = tensor("op_1402_cast_fp16")]; tensor var_1403 = const()[name = tensor("op_1403"), val = tensor([1, 20, 64, -1])]; tensor var_1404_cast_fp16 = reshape(shape = var_1403, x = value_23_cast_fp16)[name = tensor("op_1404_cast_fp16")]; tensor attn_23_transpose_x_0 = const()[name = tensor("attn_23_transpose_x_0"), val = tensor(false)]; tensor attn_23_transpose_y_0 = const()[name = tensor("attn_23_transpose_y_0"), val = tensor(true)]; tensor attn_23_cast_fp16 = matmul(transpose_x = attn_23_transpose_x_0, transpose_y = attn_23_transpose_y_0, x = var_1404_cast_fp16, y = var_1402_cast_fp16)[name = tensor("attn_23_cast_fp16")]; tensor var_1407 = const()[name = tensor("op_1407"), val = tensor([1, 1280, 1, -1])]; tensor input_53_cast_fp16 = reshape(shape = var_1407, x = attn_23_cast_fp16)[name = tensor("input_53_cast_fp16")]; tensor var_1411 = const()[name = tensor("op_1411"), val = tensor([1, 1])]; tensor var_1413 = const()[name = tensor("op_1413"), val = tensor([1, 1])]; tensor obj_71_pad_type_0 = const()[name = tensor("obj_71_pad_type_0"), val = tensor("custom")]; tensor obj_71_pad_0 = const()[name = tensor("obj_71_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240111360))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241340224))), name = tensor("layers_5_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_5_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_5_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241340416)))]; tensor obj_71_cast_fp16 = conv(bias = layers_5_encoder_attn_o_proj_bias_to_fp16, dilations = var_1413, groups = var_1253, pad = obj_71_pad_0, pad_type = obj_71_pad_type_0, strides = var_1411, weight = layers_5_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_53_cast_fp16)[name = tensor("obj_71_cast_fp16")]; tensor inputs_35_cast_fp16 = add(x = inputs_33_cast_fp16, y = obj_71_cast_fp16)[name = tensor("inputs_35_cast_fp16")]; tensor var_1419 = const()[name = tensor("op_1419"), val = tensor([1])]; tensor channels_mean_35_cast_fp16 = reduce_mean(axes = var_1419, keep_dims = var_1254, x = inputs_35_cast_fp16)[name = tensor("channels_mean_35_cast_fp16")]; tensor zero_mean_35_cast_fp16 = sub(x = inputs_35_cast_fp16, y = channels_mean_35_cast_fp16)[name = tensor("zero_mean_35_cast_fp16")]; tensor zero_mean_sq_35_cast_fp16 = mul(x = zero_mean_35_cast_fp16, y = zero_mean_35_cast_fp16)[name = tensor("zero_mean_sq_35_cast_fp16")]; tensor var_1423 = const()[name = tensor("op_1423"), val = tensor([1])]; tensor var_1424_cast_fp16 = reduce_mean(axes = var_1423, keep_dims = var_1254, x = zero_mean_sq_35_cast_fp16)[name = tensor("op_1424_cast_fp16")]; tensor var_1425_to_fp16 = const()[name = tensor("op_1425_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1426_cast_fp16 = add(x = var_1424_cast_fp16, y = var_1425_to_fp16)[name = tensor("op_1426_cast_fp16")]; tensor denom_35_epsilon_0 = const()[name = tensor("denom_35_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_35_cast_fp16 = rsqrt(epsilon = denom_35_epsilon_0, x = var_1426_cast_fp16)[name = tensor("denom_35_cast_fp16")]; tensor out_35_cast_fp16 = mul(x = zero_mean_35_cast_fp16, y = denom_35_cast_fp16)[name = tensor("out_35_cast_fp16")]; tensor input_55_gamma_0_to_fp16 = const()[name = tensor("input_55_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241343040)))]; tensor input_55_beta_0_to_fp16 = const()[name = tensor("input_55_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241345664)))]; tensor input_55_epsilon_0_to_fp16 = const()[name = tensor("input_55_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_55_cast_fp16 = batch_norm(beta = input_55_beta_0_to_fp16, epsilon = input_55_epsilon_0_to_fp16, gamma = input_55_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_35_cast_fp16)[name = tensor("input_55_cast_fp16")]; tensor var_1437 = const()[name = tensor("op_1437"), val = tensor([1, 1])]; tensor var_1439 = const()[name = tensor("op_1439"), val = tensor([1, 1])]; tensor input_57_pad_type_0 = const()[name = tensor("input_57_pad_type_0"), val = tensor("custom")]; tensor input_57_pad_0 = const()[name = tensor("input_57_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(241348288))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246263552))), name = tensor("layers_5_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_5_fc1_bias_to_fp16 = const()[name = tensor("layers_5_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246263744)))]; tensor input_57_cast_fp16 = conv(bias = layers_5_fc1_bias_to_fp16, dilations = var_1439, groups = var_1253, pad = input_57_pad_0, pad_type = input_57_pad_type_0, strides = var_1437, weight = layers_5_fc1_weight_to_fp16_palettized, x = input_55_cast_fp16)[name = tensor("input_57_cast_fp16")]; tensor input_59_mode_0 = const()[name = tensor("input_59_mode_0"), val = tensor("EXACT")]; tensor input_59_cast_fp16 = gelu(mode = input_59_mode_0, x = input_57_cast_fp16)[name = tensor("input_59_cast_fp16")]; tensor var_1445 = const()[name = tensor("op_1445"), val = tensor([1, 1])]; tensor var_1447 = const()[name = tensor("op_1447"), val = tensor([1, 1])]; tensor hidden_states_13_pad_type_0 = const()[name = tensor("hidden_states_13_pad_type_0"), val = tensor("custom")]; tensor hidden_states_13_pad_0 = const()[name = tensor("hidden_states_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_5_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246274048))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(251189312))), name = tensor("layers_5_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_5_fc2_bias_to_fp16 = const()[name = tensor("layers_5_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(251189504)))]; tensor hidden_states_13_cast_fp16 = conv(bias = layers_5_fc2_bias_to_fp16, dilations = var_1447, groups = var_1253, pad = hidden_states_13_pad_0, pad_type = hidden_states_13_pad_type_0, strides = var_1445, weight = layers_5_fc2_weight_to_fp16_palettized, x = input_59_cast_fp16)[name = tensor("hidden_states_13_cast_fp16")]; tensor inputs_37_cast_fp16 = add(x = inputs_35_cast_fp16, y = hidden_states_13_cast_fp16)[name = tensor("inputs_37_cast_fp16")]; tensor var_1460 = const()[name = tensor("op_1460"), val = tensor(3)]; tensor var_1467 = const()[name = tensor("op_1467"), val = tensor(1)]; tensor var_1468 = const()[name = tensor("op_1468"), val = tensor(true)]; tensor var_1480 = const()[name = tensor("op_1480"), val = tensor([1])]; tensor channels_mean_37_cast_fp16 = reduce_mean(axes = var_1480, keep_dims = var_1468, x = inputs_37_cast_fp16)[name = tensor("channels_mean_37_cast_fp16")]; tensor zero_mean_37_cast_fp16 = sub(x = inputs_37_cast_fp16, y = channels_mean_37_cast_fp16)[name = tensor("zero_mean_37_cast_fp16")]; tensor zero_mean_sq_37_cast_fp16 = mul(x = zero_mean_37_cast_fp16, y = zero_mean_37_cast_fp16)[name = tensor("zero_mean_sq_37_cast_fp16")]; tensor var_1484 = const()[name = tensor("op_1484"), val = tensor([1])]; tensor var_1485_cast_fp16 = reduce_mean(axes = var_1484, keep_dims = var_1468, x = zero_mean_sq_37_cast_fp16)[name = tensor("op_1485_cast_fp16")]; tensor var_1486_to_fp16 = const()[name = tensor("op_1486_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1487_cast_fp16 = add(x = var_1485_cast_fp16, y = var_1486_to_fp16)[name = tensor("op_1487_cast_fp16")]; tensor denom_37_epsilon_0 = const()[name = tensor("denom_37_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_37_cast_fp16 = rsqrt(epsilon = denom_37_epsilon_0, x = var_1487_cast_fp16)[name = tensor("denom_37_cast_fp16")]; tensor out_37_cast_fp16 = mul(x = zero_mean_37_cast_fp16, y = denom_37_cast_fp16)[name = tensor("out_37_cast_fp16")]; tensor obj_73_gamma_0_to_fp16 = const()[name = tensor("obj_73_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(251192128)))]; tensor obj_73_beta_0_to_fp16 = const()[name = tensor("obj_73_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(251194752)))]; tensor obj_73_epsilon_0_to_fp16 = const()[name = tensor("obj_73_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_73_cast_fp16 = batch_norm(beta = obj_73_beta_0_to_fp16, epsilon = obj_73_epsilon_0_to_fp16, gamma = obj_73_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_37_cast_fp16)[name = tensor("obj_73_cast_fp16")]; tensor var_1502 = const()[name = tensor("op_1502"), val = tensor([1, 1])]; tensor var_1504 = const()[name = tensor("op_1504"), val = tensor([1, 1])]; tensor query_25_pad_type_0 = const()[name = tensor("query_25_pad_type_0"), val = tensor("custom")]; tensor query_25_pad_0 = const()[name = tensor("query_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(251197376))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252426240))), name = tensor("layers_6_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_6_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_6_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252426432)))]; tensor query_25_cast_fp16 = conv(bias = layers_6_self_attn_q_proj_bias_to_fp16, dilations = var_1504, groups = var_1467, pad = query_25_pad_0, pad_type = query_25_pad_type_0, strides = var_1502, weight = layers_6_self_attn_q_proj_weight_to_fp16_palettized, x = obj_73_cast_fp16)[name = tensor("query_25_cast_fp16")]; tensor var_1508 = const()[name = tensor("op_1508"), val = tensor([1, 1])]; tensor var_1510 = const()[name = tensor("op_1510"), val = tensor([1, 1])]; tensor current_key_13_pad_type_0 = const()[name = tensor("current_key_13_pad_type_0"), val = tensor("custom")]; tensor current_key_13_pad_0 = const()[name = tensor("current_key_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(252429056))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253248320))), name = tensor("layers_6_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_13_cast_fp16 = conv(dilations = var_1510, groups = var_1467, pad = current_key_13_pad_0, pad_type = current_key_13_pad_type_0, strides = var_1508, weight = layers_6_self_attn_k_proj_weight_to_fp16_palettized, x = obj_73_cast_fp16)[name = tensor("current_key_13_cast_fp16")]; tensor var_1515 = const()[name = tensor("op_1515"), val = tensor([1, 1])]; tensor var_1517 = const()[name = tensor("op_1517"), val = tensor([1, 1])]; tensor current_value_13_pad_type_0 = const()[name = tensor("current_value_13_pad_type_0"), val = tensor("custom")]; tensor current_value_13_pad_0 = const()[name = tensor("current_value_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253248448))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254067712))), name = tensor("layers_6_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_6_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_6_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254067840)))]; tensor current_value_13_cast_fp16 = conv(bias = layers_6_self_attn_v_proj_bias_to_fp16, dilations = var_1517, groups = var_1467, pad = current_value_13_pad_0, pad_type = current_value_13_pad_type_0, strides = var_1515, weight = layers_6_self_attn_v_proj_weight_to_fp16_palettized, x = obj_73_cast_fp16)[name = tensor("current_value_13_cast_fp16")]; tensor var_1524_cast_fp16 = mul(x = current_key_13_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1524_cast_fp16")]; tensor var_1526_cast_fp16 = mul(x = var_103_cast_fp16_6, y = var_241_cast_fp16)[name = tensor("op_1526_cast_fp16")]; tensor key_25_cast_fp16 = add(x = var_1524_cast_fp16, y = var_1526_cast_fp16)[name = tensor("key_25_cast_fp16")]; tensor var_1528_cast_fp16 = mul(x = current_value_13_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1528_cast_fp16")]; tensor var_1530_cast_fp16 = mul(x = var_138_cast_fp16_6, y = var_241_cast_fp16)[name = tensor("op_1530_cast_fp16")]; tensor value_25_cast_fp16 = add(x = var_1528_cast_fp16, y = var_1530_cast_fp16)[name = tensor("value_25_cast_fp16")]; tensor var_1533 = const()[name = tensor("op_1533"), val = tensor([1, 20, 64, -1])]; tensor var_1534_cast_fp16 = reshape(shape = var_1533, x = query_25_cast_fp16)[name = tensor("op_1534_cast_fp16")]; tensor var_1535_to_fp16 = const()[name = tensor("op_1535_to_fp16"), val = tensor(0x1p-3)]; tensor var_1536_cast_fp16 = mul(x = var_1534_cast_fp16, y = var_1535_to_fp16)[name = tensor("op_1536_cast_fp16")]; tensor var_1537 = const()[name = tensor("op_1537"), val = tensor([1, 20, 64, -1])]; tensor var_1538_cast_fp16 = reshape(shape = var_1537, x = key_25_cast_fp16)[name = tensor("op_1538_cast_fp16")]; tensor mh_w_37_transpose_x_0 = const()[name = tensor("mh_w_37_transpose_x_0"), val = tensor(true)]; tensor mh_w_37_transpose_y_0 = const()[name = tensor("mh_w_37_transpose_y_0"), val = tensor(false)]; tensor mh_w_37_cast_fp16 = matmul(transpose_x = mh_w_37_transpose_x_0, transpose_y = mh_w_37_transpose_y_0, x = var_1536_cast_fp16, y = var_1538_cast_fp16)[name = tensor("mh_w_37_cast_fp16")]; tensor mh_w_39_cast_fp16 = add(x = mh_w_37_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_39_cast_fp16")]; tensor var_1546_cast_fp16 = softmax(axis = var_1460, x = mh_w_39_cast_fp16)[name = tensor("op_1546_cast_fp16")]; tensor var_1547 = const()[name = tensor("op_1547"), val = tensor([1, 20, 64, -1])]; tensor var_1548_cast_fp16 = reshape(shape = var_1547, x = value_25_cast_fp16)[name = tensor("op_1548_cast_fp16")]; tensor attn_25_transpose_x_0 = const()[name = tensor("attn_25_transpose_x_0"), val = tensor(false)]; tensor attn_25_transpose_y_0 = const()[name = tensor("attn_25_transpose_y_0"), val = tensor(true)]; tensor attn_25_cast_fp16 = matmul(transpose_x = attn_25_transpose_x_0, transpose_y = attn_25_transpose_y_0, x = var_1548_cast_fp16, y = var_1546_cast_fp16)[name = tensor("attn_25_cast_fp16")]; tensor var_1551 = const()[name = tensor("op_1551"), val = tensor([1, 1280, 1, -1])]; tensor input_61_cast_fp16 = reshape(shape = var_1551, x = attn_25_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor var_1555 = const()[name = tensor("op_1555"), val = tensor([1, 1])]; tensor var_1557 = const()[name = tensor("op_1557"), val = tensor([1, 1])]; tensor obj_79_pad_type_0 = const()[name = tensor("obj_79_pad_type_0"), val = tensor("custom")]; tensor obj_79_pad_0 = const()[name = tensor("obj_79_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(254070464))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255299328))), name = tensor("layers_6_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_6_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_6_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255299520)))]; tensor obj_79_cast_fp16 = conv(bias = layers_6_self_attn_o_proj_bias_to_fp16, dilations = var_1557, groups = var_1467, pad = obj_79_pad_0, pad_type = obj_79_pad_type_0, strides = var_1555, weight = layers_6_self_attn_o_proj_weight_to_fp16_palettized, x = input_61_cast_fp16)[name = tensor("obj_79_cast_fp16")]; tensor inputs_39_cast_fp16 = add(x = inputs_37_cast_fp16, y = obj_79_cast_fp16)[name = tensor("inputs_39_cast_fp16")]; tensor var_1567 = const()[name = tensor("op_1567"), val = tensor([1])]; tensor channels_mean_39_cast_fp16 = reduce_mean(axes = var_1567, keep_dims = var_1468, x = inputs_39_cast_fp16)[name = tensor("channels_mean_39_cast_fp16")]; tensor zero_mean_39_cast_fp16 = sub(x = inputs_39_cast_fp16, y = channels_mean_39_cast_fp16)[name = tensor("zero_mean_39_cast_fp16")]; tensor zero_mean_sq_39_cast_fp16 = mul(x = zero_mean_39_cast_fp16, y = zero_mean_39_cast_fp16)[name = tensor("zero_mean_sq_39_cast_fp16")]; tensor var_1571 = const()[name = tensor("op_1571"), val = tensor([1])]; tensor var_1572_cast_fp16 = reduce_mean(axes = var_1571, keep_dims = var_1468, x = zero_mean_sq_39_cast_fp16)[name = tensor("op_1572_cast_fp16")]; tensor var_1573_to_fp16 = const()[name = tensor("op_1573_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1574_cast_fp16 = add(x = var_1572_cast_fp16, y = var_1573_to_fp16)[name = tensor("op_1574_cast_fp16")]; tensor denom_39_epsilon_0 = const()[name = tensor("denom_39_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_39_cast_fp16 = rsqrt(epsilon = denom_39_epsilon_0, x = var_1574_cast_fp16)[name = tensor("denom_39_cast_fp16")]; tensor out_39_cast_fp16 = mul(x = zero_mean_39_cast_fp16, y = denom_39_cast_fp16)[name = tensor("out_39_cast_fp16")]; tensor obj_81_gamma_0_to_fp16 = const()[name = tensor("obj_81_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255302144)))]; tensor obj_81_beta_0_to_fp16 = const()[name = tensor("obj_81_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255304768)))]; tensor obj_81_epsilon_0_to_fp16 = const()[name = tensor("obj_81_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_81_cast_fp16 = batch_norm(beta = obj_81_beta_0_to_fp16, epsilon = obj_81_epsilon_0_to_fp16, gamma = obj_81_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_39_cast_fp16)[name = tensor("obj_81_cast_fp16")]; tensor var_1589 = const()[name = tensor("op_1589"), val = tensor([1, 1])]; tensor var_1591 = const()[name = tensor("op_1591"), val = tensor([1, 1])]; tensor query_27_pad_type_0 = const()[name = tensor("query_27_pad_type_0"), val = tensor("custom")]; tensor query_27_pad_0 = const()[name = tensor("query_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(255307392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256126656))), name = tensor("layers_6_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_6_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_6_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256126784)))]; tensor query_27_cast_fp16 = conv(bias = layers_6_encoder_attn_q_proj_bias_to_fp16, dilations = var_1591, groups = var_1467, pad = query_27_pad_0, pad_type = query_27_pad_type_0, strides = var_1589, weight = layers_6_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_81_cast_fp16)[name = tensor("query_27_cast_fp16")]; tensor var_1595 = const()[name = tensor("op_1595"), val = tensor([1, 1])]; tensor var_1597 = const()[name = tensor("op_1597"), val = tensor([1, 1])]; tensor key_27_pad_type_0 = const()[name = tensor("key_27_pad_type_0"), val = tensor("custom")]; tensor key_27_pad_0 = const()[name = tensor("key_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256129408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256948672))), name = tensor("layers_6_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_27_cast_fp16 = conv(dilations = var_1597, groups = var_1467, pad = key_27_pad_0, pad_type = key_27_pad_type_0, strides = var_1595, weight = layers_6_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_27_cast_fp16")]; tensor var_1602 = const()[name = tensor("op_1602"), val = tensor([1, 1])]; tensor var_1604 = const()[name = tensor("op_1604"), val = tensor([1, 1])]; tensor value_27_pad_type_0 = const()[name = tensor("value_27_pad_type_0"), val = tensor("custom")]; tensor value_27_pad_0 = const()[name = tensor("value_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(256948800))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257768064))), name = tensor("layers_6_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_6_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_6_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257768192)))]; tensor value_27_cast_fp16 = conv(bias = layers_6_encoder_attn_v_proj_bias_to_fp16, dilations = var_1604, groups = var_1467, pad = value_27_pad_0, pad_type = value_27_pad_type_0, strides = var_1602, weight = layers_6_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_27_cast_fp16")]; tensor var_1608 = const()[name = tensor("op_1608"), val = tensor([1, 20, 64, -1])]; tensor var_1609_cast_fp16 = reshape(shape = var_1608, x = query_27_cast_fp16)[name = tensor("op_1609_cast_fp16")]; tensor var_1610_to_fp16 = const()[name = tensor("op_1610_to_fp16"), val = tensor(0x1p-3)]; tensor var_1611_cast_fp16 = mul(x = var_1609_cast_fp16, y = var_1610_to_fp16)[name = tensor("op_1611_cast_fp16")]; tensor var_1612 = const()[name = tensor("op_1612"), val = tensor([1, 20, 64, -1])]; tensor var_1613_cast_fp16 = reshape(shape = var_1612, x = key_27_cast_fp16)[name = tensor("op_1613_cast_fp16")]; tensor mh_w_41_transpose_x_0 = const()[name = tensor("mh_w_41_transpose_x_0"), val = tensor(true)]; tensor mh_w_41_transpose_y_0 = const()[name = tensor("mh_w_41_transpose_y_0"), val = tensor(false)]; tensor mh_w_41_cast_fp16 = matmul(transpose_x = mh_w_41_transpose_x_0, transpose_y = mh_w_41_transpose_y_0, x = var_1611_cast_fp16, y = var_1613_cast_fp16)[name = tensor("mh_w_41_cast_fp16")]; tensor var_1616_cast_fp16 = softmax(axis = var_1460, x = mh_w_41_cast_fp16)[name = tensor("op_1616_cast_fp16")]; tensor var_1617 = const()[name = tensor("op_1617"), val = tensor([1, 20, 64, -1])]; tensor var_1618_cast_fp16 = reshape(shape = var_1617, x = value_27_cast_fp16)[name = tensor("op_1618_cast_fp16")]; tensor attn_27_transpose_x_0 = const()[name = tensor("attn_27_transpose_x_0"), val = tensor(false)]; tensor attn_27_transpose_y_0 = const()[name = tensor("attn_27_transpose_y_0"), val = tensor(true)]; tensor attn_27_cast_fp16 = matmul(transpose_x = attn_27_transpose_x_0, transpose_y = attn_27_transpose_y_0, x = var_1618_cast_fp16, y = var_1616_cast_fp16)[name = tensor("attn_27_cast_fp16")]; tensor var_1621 = const()[name = tensor("op_1621"), val = tensor([1, 1280, 1, -1])]; tensor input_63_cast_fp16 = reshape(shape = var_1621, x = attn_27_cast_fp16)[name = tensor("input_63_cast_fp16")]; tensor var_1625 = const()[name = tensor("op_1625"), val = tensor([1, 1])]; tensor var_1627 = const()[name = tensor("op_1627"), val = tensor([1, 1])]; tensor obj_83_pad_type_0 = const()[name = tensor("obj_83_pad_type_0"), val = tensor("custom")]; tensor obj_83_pad_0 = const()[name = tensor("obj_83_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(257770816))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259409280))), name = tensor("layers_6_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_6_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_6_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259409856)))]; tensor obj_83_cast_fp16 = conv(bias = layers_6_encoder_attn_o_proj_bias_to_fp16, dilations = var_1627, groups = var_1467, pad = obj_83_pad_0, pad_type = obj_83_pad_type_0, strides = var_1625, weight = layers_6_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_63_cast_fp16)[name = tensor("obj_83_cast_fp16")]; tensor inputs_41_cast_fp16 = add(x = inputs_39_cast_fp16, y = obj_83_cast_fp16)[name = tensor("inputs_41_cast_fp16")]; tensor var_1633 = const()[name = tensor("op_1633"), val = tensor([1])]; tensor channels_mean_41_cast_fp16 = reduce_mean(axes = var_1633, keep_dims = var_1468, x = inputs_41_cast_fp16)[name = tensor("channels_mean_41_cast_fp16")]; tensor zero_mean_41_cast_fp16 = sub(x = inputs_41_cast_fp16, y = channels_mean_41_cast_fp16)[name = tensor("zero_mean_41_cast_fp16")]; tensor zero_mean_sq_41_cast_fp16 = mul(x = zero_mean_41_cast_fp16, y = zero_mean_41_cast_fp16)[name = tensor("zero_mean_sq_41_cast_fp16")]; tensor var_1637 = const()[name = tensor("op_1637"), val = tensor([1])]; tensor var_1638_cast_fp16 = reduce_mean(axes = var_1637, keep_dims = var_1468, x = zero_mean_sq_41_cast_fp16)[name = tensor("op_1638_cast_fp16")]; tensor var_1639_to_fp16 = const()[name = tensor("op_1639_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1640_cast_fp16 = add(x = var_1638_cast_fp16, y = var_1639_to_fp16)[name = tensor("op_1640_cast_fp16")]; tensor denom_41_epsilon_0 = const()[name = tensor("denom_41_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_41_cast_fp16 = rsqrt(epsilon = denom_41_epsilon_0, x = var_1640_cast_fp16)[name = tensor("denom_41_cast_fp16")]; tensor out_41_cast_fp16 = mul(x = zero_mean_41_cast_fp16, y = denom_41_cast_fp16)[name = tensor("out_41_cast_fp16")]; tensor input_65_gamma_0_to_fp16 = const()[name = tensor("input_65_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259412480)))]; tensor input_65_beta_0_to_fp16 = const()[name = tensor("input_65_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259415104)))]; tensor input_65_epsilon_0_to_fp16 = const()[name = tensor("input_65_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_65_cast_fp16 = batch_norm(beta = input_65_beta_0_to_fp16, epsilon = input_65_epsilon_0_to_fp16, gamma = input_65_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_41_cast_fp16)[name = tensor("input_65_cast_fp16")]; tensor var_1651 = const()[name = tensor("op_1651"), val = tensor([1, 1])]; tensor var_1653 = const()[name = tensor("op_1653"), val = tensor([1, 1])]; tensor input_67_pad_type_0 = const()[name = tensor("input_67_pad_type_0"), val = tensor("custom")]; tensor input_67_pad_0 = const()[name = tensor("input_67_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(259417728))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(264332992))), name = tensor("layers_6_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_6_fc1_bias_to_fp16 = const()[name = tensor("layers_6_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(264333184)))]; tensor input_67_cast_fp16 = conv(bias = layers_6_fc1_bias_to_fp16, dilations = var_1653, groups = var_1467, pad = input_67_pad_0, pad_type = input_67_pad_type_0, strides = var_1651, weight = layers_6_fc1_weight_to_fp16_palettized, x = input_65_cast_fp16)[name = tensor("input_67_cast_fp16")]; tensor input_69_mode_0 = const()[name = tensor("input_69_mode_0"), val = tensor("EXACT")]; tensor input_69_cast_fp16 = gelu(mode = input_69_mode_0, x = input_67_cast_fp16)[name = tensor("input_69_cast_fp16")]; tensor var_1659 = const()[name = tensor("op_1659"), val = tensor([1, 1])]; tensor var_1661 = const()[name = tensor("op_1661"), val = tensor([1, 1])]; tensor hidden_states_15_pad_type_0 = const()[name = tensor("hidden_states_15_pad_type_0"), val = tensor("custom")]; tensor hidden_states_15_pad_0 = const()[name = tensor("hidden_states_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_6_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(264343488))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270897152))), name = tensor("layers_6_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_6_fc2_bias_to_fp16 = const()[name = tensor("layers_6_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270897728)))]; tensor hidden_states_15_cast_fp16 = conv(bias = layers_6_fc2_bias_to_fp16, dilations = var_1661, groups = var_1467, pad = hidden_states_15_pad_0, pad_type = hidden_states_15_pad_type_0, strides = var_1659, weight = layers_6_fc2_weight_to_fp16_palettized, x = input_69_cast_fp16)[name = tensor("hidden_states_15_cast_fp16")]; tensor inputs_43_cast_fp16 = add(x = inputs_41_cast_fp16, y = hidden_states_15_cast_fp16)[name = tensor("inputs_43_cast_fp16")]; tensor var_1674 = const()[name = tensor("op_1674"), val = tensor(3)]; tensor var_1681 = const()[name = tensor("op_1681"), val = tensor(1)]; tensor var_1682 = const()[name = tensor("op_1682"), val = tensor(true)]; tensor var_1694 = const()[name = tensor("op_1694"), val = tensor([1])]; tensor channels_mean_43_cast_fp16 = reduce_mean(axes = var_1694, keep_dims = var_1682, x = inputs_43_cast_fp16)[name = tensor("channels_mean_43_cast_fp16")]; tensor zero_mean_43_cast_fp16 = sub(x = inputs_43_cast_fp16, y = channels_mean_43_cast_fp16)[name = tensor("zero_mean_43_cast_fp16")]; tensor zero_mean_sq_43_cast_fp16 = mul(x = zero_mean_43_cast_fp16, y = zero_mean_43_cast_fp16)[name = tensor("zero_mean_sq_43_cast_fp16")]; tensor var_1698 = const()[name = tensor("op_1698"), val = tensor([1])]; tensor var_1699_cast_fp16 = reduce_mean(axes = var_1698, keep_dims = var_1682, x = zero_mean_sq_43_cast_fp16)[name = tensor("op_1699_cast_fp16")]; tensor var_1700_to_fp16 = const()[name = tensor("op_1700_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1701_cast_fp16 = add(x = var_1699_cast_fp16, y = var_1700_to_fp16)[name = tensor("op_1701_cast_fp16")]; tensor denom_43_epsilon_0 = const()[name = tensor("denom_43_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_43_cast_fp16 = rsqrt(epsilon = denom_43_epsilon_0, x = var_1701_cast_fp16)[name = tensor("denom_43_cast_fp16")]; tensor out_43_cast_fp16 = mul(x = zero_mean_43_cast_fp16, y = denom_43_cast_fp16)[name = tensor("out_43_cast_fp16")]; tensor obj_85_gamma_0_to_fp16 = const()[name = tensor("obj_85_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270900352)))]; tensor obj_85_beta_0_to_fp16 = const()[name = tensor("obj_85_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270902976)))]; tensor obj_85_epsilon_0_to_fp16 = const()[name = tensor("obj_85_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_85_cast_fp16 = batch_norm(beta = obj_85_beta_0_to_fp16, epsilon = obj_85_epsilon_0_to_fp16, gamma = obj_85_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_43_cast_fp16)[name = tensor("obj_85_cast_fp16")]; tensor var_1716 = const()[name = tensor("op_1716"), val = tensor([1, 1])]; tensor var_1718 = const()[name = tensor("op_1718"), val = tensor([1, 1])]; tensor query_29_pad_type_0 = const()[name = tensor("query_29_pad_type_0"), val = tensor("custom")]; tensor query_29_pad_0 = const()[name = tensor("query_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270905600))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272134464))), name = tensor("layers_7_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_7_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_7_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272134656)))]; tensor query_29_cast_fp16 = conv(bias = layers_7_self_attn_q_proj_bias_to_fp16, dilations = var_1718, groups = var_1681, pad = query_29_pad_0, pad_type = query_29_pad_type_0, strides = var_1716, weight = layers_7_self_attn_q_proj_weight_to_fp16_palettized, x = obj_85_cast_fp16)[name = tensor("query_29_cast_fp16")]; tensor var_1722 = const()[name = tensor("op_1722"), val = tensor([1, 1])]; tensor var_1724 = const()[name = tensor("op_1724"), val = tensor([1, 1])]; tensor current_key_15_pad_type_0 = const()[name = tensor("current_key_15_pad_type_0"), val = tensor("custom")]; tensor current_key_15_pad_0 = const()[name = tensor("current_key_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272137280))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272956544))), name = tensor("layers_7_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_15_cast_fp16 = conv(dilations = var_1724, groups = var_1681, pad = current_key_15_pad_0, pad_type = current_key_15_pad_type_0, strides = var_1722, weight = layers_7_self_attn_k_proj_weight_to_fp16_palettized, x = obj_85_cast_fp16)[name = tensor("current_key_15_cast_fp16")]; tensor var_1729 = const()[name = tensor("op_1729"), val = tensor([1, 1])]; tensor var_1731 = const()[name = tensor("op_1731"), val = tensor([1, 1])]; tensor current_value_15_pad_type_0 = const()[name = tensor("current_value_15_pad_type_0"), val = tensor("custom")]; tensor current_value_15_pad_0 = const()[name = tensor("current_value_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(272956672))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(273775936))), name = tensor("layers_7_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_7_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_7_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(273776064)))]; tensor current_value_15_cast_fp16 = conv(bias = layers_7_self_attn_v_proj_bias_to_fp16, dilations = var_1731, groups = var_1681, pad = current_value_15_pad_0, pad_type = current_value_15_pad_type_0, strides = var_1729, weight = layers_7_self_attn_v_proj_weight_to_fp16_palettized, x = obj_85_cast_fp16)[name = tensor("current_value_15_cast_fp16")]; tensor var_1738_cast_fp16 = mul(x = current_key_15_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1738_cast_fp16")]; tensor var_1740_cast_fp16 = mul(x = var_103_cast_fp16_7, y = var_241_cast_fp16)[name = tensor("op_1740_cast_fp16")]; tensor key_29_cast_fp16 = add(x = var_1738_cast_fp16, y = var_1740_cast_fp16)[name = tensor("key_29_cast_fp16")]; tensor var_1742_cast_fp16 = mul(x = current_value_15_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1742_cast_fp16")]; tensor var_1744_cast_fp16 = mul(x = var_138_cast_fp16_7, y = var_241_cast_fp16)[name = tensor("op_1744_cast_fp16")]; tensor value_29_cast_fp16 = add(x = var_1742_cast_fp16, y = var_1744_cast_fp16)[name = tensor("value_29_cast_fp16")]; tensor var_1747 = const()[name = tensor("op_1747"), val = tensor([1, 20, 64, -1])]; tensor var_1748_cast_fp16 = reshape(shape = var_1747, x = query_29_cast_fp16)[name = tensor("op_1748_cast_fp16")]; tensor var_1749_to_fp16 = const()[name = tensor("op_1749_to_fp16"), val = tensor(0x1p-3)]; tensor var_1750_cast_fp16 = mul(x = var_1748_cast_fp16, y = var_1749_to_fp16)[name = tensor("op_1750_cast_fp16")]; tensor var_1751 = const()[name = tensor("op_1751"), val = tensor([1, 20, 64, -1])]; tensor var_1752_cast_fp16 = reshape(shape = var_1751, x = key_29_cast_fp16)[name = tensor("op_1752_cast_fp16")]; tensor mh_w_43_transpose_x_0 = const()[name = tensor("mh_w_43_transpose_x_0"), val = tensor(true)]; tensor mh_w_43_transpose_y_0 = const()[name = tensor("mh_w_43_transpose_y_0"), val = tensor(false)]; tensor mh_w_43_cast_fp16 = matmul(transpose_x = mh_w_43_transpose_x_0, transpose_y = mh_w_43_transpose_y_0, x = var_1750_cast_fp16, y = var_1752_cast_fp16)[name = tensor("mh_w_43_cast_fp16")]; tensor mh_w_45_cast_fp16 = add(x = mh_w_43_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_45_cast_fp16")]; tensor var_1760_cast_fp16 = softmax(axis = var_1674, x = mh_w_45_cast_fp16)[name = tensor("op_1760_cast_fp16")]; tensor var_1761 = const()[name = tensor("op_1761"), val = tensor([1, 20, 64, -1])]; tensor var_1762_cast_fp16 = reshape(shape = var_1761, x = value_29_cast_fp16)[name = tensor("op_1762_cast_fp16")]; tensor attn_29_transpose_x_0 = const()[name = tensor("attn_29_transpose_x_0"), val = tensor(false)]; tensor attn_29_transpose_y_0 = const()[name = tensor("attn_29_transpose_y_0"), val = tensor(true)]; tensor attn_29_cast_fp16 = matmul(transpose_x = attn_29_transpose_x_0, transpose_y = attn_29_transpose_y_0, x = var_1762_cast_fp16, y = var_1760_cast_fp16)[name = tensor("attn_29_cast_fp16")]; tensor var_1765 = const()[name = tensor("op_1765"), val = tensor([1, 1280, 1, -1])]; tensor input_71_cast_fp16 = reshape(shape = var_1765, x = attn_29_cast_fp16)[name = tensor("input_71_cast_fp16")]; tensor var_1769 = const()[name = tensor("op_1769"), val = tensor([1, 1])]; tensor var_1771 = const()[name = tensor("op_1771"), val = tensor([1, 1])]; tensor obj_91_pad_type_0 = const()[name = tensor("obj_91_pad_type_0"), val = tensor("custom")]; tensor obj_91_pad_0 = const()[name = tensor("obj_91_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(273778688))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275007552))), name = tensor("layers_7_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_7_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_7_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275007744)))]; tensor obj_91_cast_fp16 = conv(bias = layers_7_self_attn_o_proj_bias_to_fp16, dilations = var_1771, groups = var_1681, pad = obj_91_pad_0, pad_type = obj_91_pad_type_0, strides = var_1769, weight = layers_7_self_attn_o_proj_weight_to_fp16_palettized, x = input_71_cast_fp16)[name = tensor("obj_91_cast_fp16")]; tensor inputs_45_cast_fp16 = add(x = inputs_43_cast_fp16, y = obj_91_cast_fp16)[name = tensor("inputs_45_cast_fp16")]; tensor var_1781 = const()[name = tensor("op_1781"), val = tensor([1])]; tensor channels_mean_45_cast_fp16 = reduce_mean(axes = var_1781, keep_dims = var_1682, x = inputs_45_cast_fp16)[name = tensor("channels_mean_45_cast_fp16")]; tensor zero_mean_45_cast_fp16 = sub(x = inputs_45_cast_fp16, y = channels_mean_45_cast_fp16)[name = tensor("zero_mean_45_cast_fp16")]; tensor zero_mean_sq_45_cast_fp16 = mul(x = zero_mean_45_cast_fp16, y = zero_mean_45_cast_fp16)[name = tensor("zero_mean_sq_45_cast_fp16")]; tensor var_1785 = const()[name = tensor("op_1785"), val = tensor([1])]; tensor var_1786_cast_fp16 = reduce_mean(axes = var_1785, keep_dims = var_1682, x = zero_mean_sq_45_cast_fp16)[name = tensor("op_1786_cast_fp16")]; tensor var_1787_to_fp16 = const()[name = tensor("op_1787_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1788_cast_fp16 = add(x = var_1786_cast_fp16, y = var_1787_to_fp16)[name = tensor("op_1788_cast_fp16")]; tensor denom_45_epsilon_0 = const()[name = tensor("denom_45_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_45_cast_fp16 = rsqrt(epsilon = denom_45_epsilon_0, x = var_1788_cast_fp16)[name = tensor("denom_45_cast_fp16")]; tensor out_45_cast_fp16 = mul(x = zero_mean_45_cast_fp16, y = denom_45_cast_fp16)[name = tensor("out_45_cast_fp16")]; tensor obj_93_gamma_0_to_fp16 = const()[name = tensor("obj_93_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275010368)))]; tensor obj_93_beta_0_to_fp16 = const()[name = tensor("obj_93_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275012992)))]; tensor obj_93_epsilon_0_to_fp16 = const()[name = tensor("obj_93_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_93_cast_fp16 = batch_norm(beta = obj_93_beta_0_to_fp16, epsilon = obj_93_epsilon_0_to_fp16, gamma = obj_93_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_45_cast_fp16)[name = tensor("obj_93_cast_fp16")]; tensor var_1803 = const()[name = tensor("op_1803"), val = tensor([1, 1])]; tensor var_1805 = const()[name = tensor("op_1805"), val = tensor([1, 1])]; tensor query_31_pad_type_0 = const()[name = tensor("query_31_pad_type_0"), val = tensor("custom")]; tensor query_31_pad_0 = const()[name = tensor("query_31_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275015616))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275834880))), name = tensor("layers_7_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_7_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_7_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275835008)))]; tensor query_31_cast_fp16 = conv(bias = layers_7_encoder_attn_q_proj_bias_to_fp16, dilations = var_1805, groups = var_1681, pad = query_31_pad_0, pad_type = query_31_pad_type_0, strides = var_1803, weight = layers_7_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_93_cast_fp16)[name = tensor("query_31_cast_fp16")]; tensor var_1809 = const()[name = tensor("op_1809"), val = tensor([1, 1])]; tensor var_1811 = const()[name = tensor("op_1811"), val = tensor([1, 1])]; tensor key_31_pad_type_0 = const()[name = tensor("key_31_pad_type_0"), val = tensor("custom")]; tensor key_31_pad_0 = const()[name = tensor("key_31_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(275837632))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(276656896))), name = tensor("layers_7_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_31_cast_fp16 = conv(dilations = var_1811, groups = var_1681, pad = key_31_pad_0, pad_type = key_31_pad_type_0, strides = var_1809, weight = layers_7_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_31_cast_fp16")]; tensor var_1816 = const()[name = tensor("op_1816"), val = tensor([1, 1])]; tensor var_1818 = const()[name = tensor("op_1818"), val = tensor([1, 1])]; tensor value_31_pad_type_0 = const()[name = tensor("value_31_pad_type_0"), val = tensor("custom")]; tensor value_31_pad_0 = const()[name = tensor("value_31_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(276657024))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277885888))), name = tensor("layers_7_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_7_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_7_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277886080)))]; tensor value_31_cast_fp16 = conv(bias = layers_7_encoder_attn_v_proj_bias_to_fp16, dilations = var_1818, groups = var_1681, pad = value_31_pad_0, pad_type = value_31_pad_type_0, strides = var_1816, weight = layers_7_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_31_cast_fp16")]; tensor var_1822 = const()[name = tensor("op_1822"), val = tensor([1, 20, 64, -1])]; tensor var_1823_cast_fp16 = reshape(shape = var_1822, x = query_31_cast_fp16)[name = tensor("op_1823_cast_fp16")]; tensor var_1824_to_fp16 = const()[name = tensor("op_1824_to_fp16"), val = tensor(0x1p-3)]; tensor var_1825_cast_fp16 = mul(x = var_1823_cast_fp16, y = var_1824_to_fp16)[name = tensor("op_1825_cast_fp16")]; tensor var_1826 = const()[name = tensor("op_1826"), val = tensor([1, 20, 64, -1])]; tensor var_1827_cast_fp16 = reshape(shape = var_1826, x = key_31_cast_fp16)[name = tensor("op_1827_cast_fp16")]; tensor mh_w_47_transpose_x_0 = const()[name = tensor("mh_w_47_transpose_x_0"), val = tensor(true)]; tensor mh_w_47_transpose_y_0 = const()[name = tensor("mh_w_47_transpose_y_0"), val = tensor(false)]; tensor mh_w_47_cast_fp16 = matmul(transpose_x = mh_w_47_transpose_x_0, transpose_y = mh_w_47_transpose_y_0, x = var_1825_cast_fp16, y = var_1827_cast_fp16)[name = tensor("mh_w_47_cast_fp16")]; tensor var_1830_cast_fp16 = softmax(axis = var_1674, x = mh_w_47_cast_fp16)[name = tensor("op_1830_cast_fp16")]; tensor var_1831 = const()[name = tensor("op_1831"), val = tensor([1, 20, 64, -1])]; tensor var_1832_cast_fp16 = reshape(shape = var_1831, x = value_31_cast_fp16)[name = tensor("op_1832_cast_fp16")]; tensor attn_31_transpose_x_0 = const()[name = tensor("attn_31_transpose_x_0"), val = tensor(false)]; tensor attn_31_transpose_y_0 = const()[name = tensor("attn_31_transpose_y_0"), val = tensor(true)]; tensor attn_31_cast_fp16 = matmul(transpose_x = attn_31_transpose_x_0, transpose_y = attn_31_transpose_y_0, x = var_1832_cast_fp16, y = var_1830_cast_fp16)[name = tensor("attn_31_cast_fp16")]; tensor var_1835 = const()[name = tensor("op_1835"), val = tensor([1, 1280, 1, -1])]; tensor input_73_cast_fp16 = reshape(shape = var_1835, x = attn_31_cast_fp16)[name = tensor("input_73_cast_fp16")]; tensor var_1839 = const()[name = tensor("op_1839"), val = tensor([1, 1])]; tensor var_1841 = const()[name = tensor("op_1841"), val = tensor([1, 1])]; tensor obj_95_pad_type_0 = const()[name = tensor("obj_95_pad_type_0"), val = tensor("custom")]; tensor obj_95_pad_0 = const()[name = tensor("obj_95_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(277888704))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(279117568))), name = tensor("layers_7_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_7_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_7_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(279117760)))]; tensor obj_95_cast_fp16 = conv(bias = layers_7_encoder_attn_o_proj_bias_to_fp16, dilations = var_1841, groups = var_1681, pad = obj_95_pad_0, pad_type = obj_95_pad_type_0, strides = var_1839, weight = layers_7_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_73_cast_fp16)[name = tensor("obj_95_cast_fp16")]; tensor inputs_47_cast_fp16 = add(x = inputs_45_cast_fp16, y = obj_95_cast_fp16)[name = tensor("inputs_47_cast_fp16")]; tensor var_1847 = const()[name = tensor("op_1847"), val = tensor([1])]; tensor channels_mean_47_cast_fp16 = reduce_mean(axes = var_1847, keep_dims = var_1682, x = inputs_47_cast_fp16)[name = tensor("channels_mean_47_cast_fp16")]; tensor zero_mean_47_cast_fp16 = sub(x = inputs_47_cast_fp16, y = channels_mean_47_cast_fp16)[name = tensor("zero_mean_47_cast_fp16")]; tensor zero_mean_sq_47_cast_fp16 = mul(x = zero_mean_47_cast_fp16, y = zero_mean_47_cast_fp16)[name = tensor("zero_mean_sq_47_cast_fp16")]; tensor var_1851 = const()[name = tensor("op_1851"), val = tensor([1])]; tensor var_1852_cast_fp16 = reduce_mean(axes = var_1851, keep_dims = var_1682, x = zero_mean_sq_47_cast_fp16)[name = tensor("op_1852_cast_fp16")]; tensor var_1853_to_fp16 = const()[name = tensor("op_1853_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1854_cast_fp16 = add(x = var_1852_cast_fp16, y = var_1853_to_fp16)[name = tensor("op_1854_cast_fp16")]; tensor denom_47_epsilon_0 = const()[name = tensor("denom_47_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_47_cast_fp16 = rsqrt(epsilon = denom_47_epsilon_0, x = var_1854_cast_fp16)[name = tensor("denom_47_cast_fp16")]; tensor out_47_cast_fp16 = mul(x = zero_mean_47_cast_fp16, y = denom_47_cast_fp16)[name = tensor("out_47_cast_fp16")]; tensor input_75_gamma_0_to_fp16 = const()[name = tensor("input_75_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(279120384)))]; tensor input_75_beta_0_to_fp16 = const()[name = tensor("input_75_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(279123008)))]; tensor input_75_epsilon_0_to_fp16 = const()[name = tensor("input_75_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_75_cast_fp16 = batch_norm(beta = input_75_beta_0_to_fp16, epsilon = input_75_epsilon_0_to_fp16, gamma = input_75_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_47_cast_fp16)[name = tensor("input_75_cast_fp16")]; tensor var_1865 = const()[name = tensor("op_1865"), val = tensor([1, 1])]; tensor var_1867 = const()[name = tensor("op_1867"), val = tensor([1, 1])]; tensor input_77_pad_type_0 = const()[name = tensor("input_77_pad_type_0"), val = tensor("custom")]; tensor input_77_pad_0 = const()[name = tensor("input_77_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(279125632))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284040896))), name = tensor("layers_7_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_7_fc1_bias_to_fp16 = const()[name = tensor("layers_7_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284041088)))]; tensor input_77_cast_fp16 = conv(bias = layers_7_fc1_bias_to_fp16, dilations = var_1867, groups = var_1681, pad = input_77_pad_0, pad_type = input_77_pad_type_0, strides = var_1865, weight = layers_7_fc1_weight_to_fp16_palettized, x = input_75_cast_fp16)[name = tensor("input_77_cast_fp16")]; tensor input_79_mode_0 = const()[name = tensor("input_79_mode_0"), val = tensor("EXACT")]; tensor input_79_cast_fp16 = gelu(mode = input_79_mode_0, x = input_77_cast_fp16)[name = tensor("input_79_cast_fp16")]; tensor var_1873 = const()[name = tensor("op_1873"), val = tensor([1, 1])]; tensor var_1875 = const()[name = tensor("op_1875"), val = tensor([1, 1])]; tensor hidden_states_17_pad_type_0 = const()[name = tensor("hidden_states_17_pad_type_0"), val = tensor("custom")]; tensor hidden_states_17_pad_0 = const()[name = tensor("hidden_states_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_7_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(284051392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288966656))), name = tensor("layers_7_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_7_fc2_bias_to_fp16 = const()[name = tensor("layers_7_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288966848)))]; tensor hidden_states_17_cast_fp16 = conv(bias = layers_7_fc2_bias_to_fp16, dilations = var_1875, groups = var_1681, pad = hidden_states_17_pad_0, pad_type = hidden_states_17_pad_type_0, strides = var_1873, weight = layers_7_fc2_weight_to_fp16_palettized, x = input_79_cast_fp16)[name = tensor("hidden_states_17_cast_fp16")]; tensor inputs_49_cast_fp16 = add(x = inputs_47_cast_fp16, y = hidden_states_17_cast_fp16)[name = tensor("inputs_49_cast_fp16")]; tensor var_1888 = const()[name = tensor("op_1888"), val = tensor(3)]; tensor var_1895 = const()[name = tensor("op_1895"), val = tensor(1)]; tensor var_1896 = const()[name = tensor("op_1896"), val = tensor(true)]; tensor var_1908 = const()[name = tensor("op_1908"), val = tensor([1])]; tensor channels_mean_49_cast_fp16 = reduce_mean(axes = var_1908, keep_dims = var_1896, x = inputs_49_cast_fp16)[name = tensor("channels_mean_49_cast_fp16")]; tensor zero_mean_49_cast_fp16 = sub(x = inputs_49_cast_fp16, y = channels_mean_49_cast_fp16)[name = tensor("zero_mean_49_cast_fp16")]; tensor zero_mean_sq_49_cast_fp16 = mul(x = zero_mean_49_cast_fp16, y = zero_mean_49_cast_fp16)[name = tensor("zero_mean_sq_49_cast_fp16")]; tensor var_1912 = const()[name = tensor("op_1912"), val = tensor([1])]; tensor var_1913_cast_fp16 = reduce_mean(axes = var_1912, keep_dims = var_1896, x = zero_mean_sq_49_cast_fp16)[name = tensor("op_1913_cast_fp16")]; tensor var_1914_to_fp16 = const()[name = tensor("op_1914_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1915_cast_fp16 = add(x = var_1913_cast_fp16, y = var_1914_to_fp16)[name = tensor("op_1915_cast_fp16")]; tensor denom_49_epsilon_0 = const()[name = tensor("denom_49_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_49_cast_fp16 = rsqrt(epsilon = denom_49_epsilon_0, x = var_1915_cast_fp16)[name = tensor("denom_49_cast_fp16")]; tensor out_49_cast_fp16 = mul(x = zero_mean_49_cast_fp16, y = denom_49_cast_fp16)[name = tensor("out_49_cast_fp16")]; tensor obj_97_gamma_0_to_fp16 = const()[name = tensor("obj_97_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288969472)))]; tensor obj_97_beta_0_to_fp16 = const()[name = tensor("obj_97_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288972096)))]; tensor obj_97_epsilon_0_to_fp16 = const()[name = tensor("obj_97_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_97_cast_fp16 = batch_norm(beta = obj_97_beta_0_to_fp16, epsilon = obj_97_epsilon_0_to_fp16, gamma = obj_97_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_49_cast_fp16)[name = tensor("obj_97_cast_fp16")]; tensor var_1930 = const()[name = tensor("op_1930"), val = tensor([1, 1])]; tensor var_1932 = const()[name = tensor("op_1932"), val = tensor([1, 1])]; tensor query_33_pad_type_0 = const()[name = tensor("query_33_pad_type_0"), val = tensor("custom")]; tensor query_33_pad_0 = const()[name = tensor("query_33_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(288974720))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290203584))), name = tensor("layers_8_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_8_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_8_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290203776)))]; tensor query_33_cast_fp16 = conv(bias = layers_8_self_attn_q_proj_bias_to_fp16, dilations = var_1932, groups = var_1895, pad = query_33_pad_0, pad_type = query_33_pad_type_0, strides = var_1930, weight = layers_8_self_attn_q_proj_weight_to_fp16_palettized, x = obj_97_cast_fp16)[name = tensor("query_33_cast_fp16")]; tensor var_1936 = const()[name = tensor("op_1936"), val = tensor([1, 1])]; tensor var_1938 = const()[name = tensor("op_1938"), val = tensor([1, 1])]; tensor current_key_17_pad_type_0 = const()[name = tensor("current_key_17_pad_type_0"), val = tensor("custom")]; tensor current_key_17_pad_0 = const()[name = tensor("current_key_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(290206400))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291435264))), name = tensor("layers_8_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_17_cast_fp16 = conv(dilations = var_1938, groups = var_1895, pad = current_key_17_pad_0, pad_type = current_key_17_pad_type_0, strides = var_1936, weight = layers_8_self_attn_k_proj_weight_to_fp16_palettized, x = obj_97_cast_fp16)[name = tensor("current_key_17_cast_fp16")]; tensor var_1943 = const()[name = tensor("op_1943"), val = tensor([1, 1])]; tensor var_1945 = const()[name = tensor("op_1945"), val = tensor([1, 1])]; tensor current_value_17_pad_type_0 = const()[name = tensor("current_value_17_pad_type_0"), val = tensor("custom")]; tensor current_value_17_pad_0 = const()[name = tensor("current_value_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291435456))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292254720))), name = tensor("layers_8_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_8_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_8_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292254848)))]; tensor current_value_17_cast_fp16 = conv(bias = layers_8_self_attn_v_proj_bias_to_fp16, dilations = var_1945, groups = var_1895, pad = current_value_17_pad_0, pad_type = current_value_17_pad_type_0, strides = var_1943, weight = layers_8_self_attn_v_proj_weight_to_fp16_palettized, x = obj_97_cast_fp16)[name = tensor("current_value_17_cast_fp16")]; tensor var_1952_cast_fp16 = mul(x = current_key_17_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1952_cast_fp16")]; tensor var_1954_cast_fp16 = mul(x = var_103_cast_fp16_8, y = var_241_cast_fp16)[name = tensor("op_1954_cast_fp16")]; tensor key_33_cast_fp16 = add(x = var_1952_cast_fp16, y = var_1954_cast_fp16)[name = tensor("key_33_cast_fp16")]; tensor var_1956_cast_fp16 = mul(x = current_value_17_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_1956_cast_fp16")]; tensor var_1958_cast_fp16 = mul(x = var_138_cast_fp16_8, y = var_241_cast_fp16)[name = tensor("op_1958_cast_fp16")]; tensor value_33_cast_fp16 = add(x = var_1956_cast_fp16, y = var_1958_cast_fp16)[name = tensor("value_33_cast_fp16")]; tensor var_1961 = const()[name = tensor("op_1961"), val = tensor([1, 20, 64, -1])]; tensor var_1962_cast_fp16 = reshape(shape = var_1961, x = query_33_cast_fp16)[name = tensor("op_1962_cast_fp16")]; tensor var_1963_to_fp16 = const()[name = tensor("op_1963_to_fp16"), val = tensor(0x1p-3)]; tensor var_1964_cast_fp16 = mul(x = var_1962_cast_fp16, y = var_1963_to_fp16)[name = tensor("op_1964_cast_fp16")]; tensor var_1965 = const()[name = tensor("op_1965"), val = tensor([1, 20, 64, -1])]; tensor var_1966_cast_fp16 = reshape(shape = var_1965, x = key_33_cast_fp16)[name = tensor("op_1966_cast_fp16")]; tensor mh_w_49_transpose_x_0 = const()[name = tensor("mh_w_49_transpose_x_0"), val = tensor(true)]; tensor mh_w_49_transpose_y_0 = const()[name = tensor("mh_w_49_transpose_y_0"), val = tensor(false)]; tensor mh_w_49_cast_fp16 = matmul(transpose_x = mh_w_49_transpose_x_0, transpose_y = mh_w_49_transpose_y_0, x = var_1964_cast_fp16, y = var_1966_cast_fp16)[name = tensor("mh_w_49_cast_fp16")]; tensor mh_w_51_cast_fp16 = add(x = mh_w_49_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_51_cast_fp16")]; tensor var_1974_cast_fp16 = softmax(axis = var_1888, x = mh_w_51_cast_fp16)[name = tensor("op_1974_cast_fp16")]; tensor var_1975 = const()[name = tensor("op_1975"), val = tensor([1, 20, 64, -1])]; tensor var_1976_cast_fp16 = reshape(shape = var_1975, x = value_33_cast_fp16)[name = tensor("op_1976_cast_fp16")]; tensor attn_33_transpose_x_0 = const()[name = tensor("attn_33_transpose_x_0"), val = tensor(false)]; tensor attn_33_transpose_y_0 = const()[name = tensor("attn_33_transpose_y_0"), val = tensor(true)]; tensor attn_33_cast_fp16 = matmul(transpose_x = attn_33_transpose_x_0, transpose_y = attn_33_transpose_y_0, x = var_1976_cast_fp16, y = var_1974_cast_fp16)[name = tensor("attn_33_cast_fp16")]; tensor var_1979 = const()[name = tensor("op_1979"), val = tensor([1, 1280, 1, -1])]; tensor input_81_cast_fp16 = reshape(shape = var_1979, x = attn_33_cast_fp16)[name = tensor("input_81_cast_fp16")]; tensor var_1983 = const()[name = tensor("op_1983"), val = tensor([1, 1])]; tensor var_1985 = const()[name = tensor("op_1985"), val = tensor([1, 1])]; tensor obj_103_pad_type_0 = const()[name = tensor("obj_103_pad_type_0"), val = tensor("custom")]; tensor obj_103_pad_0 = const()[name = tensor("obj_103_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292257472))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293486336))), name = tensor("layers_8_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_8_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_8_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293486528)))]; tensor obj_103_cast_fp16 = conv(bias = layers_8_self_attn_o_proj_bias_to_fp16, dilations = var_1985, groups = var_1895, pad = obj_103_pad_0, pad_type = obj_103_pad_type_0, strides = var_1983, weight = layers_8_self_attn_o_proj_weight_to_fp16_palettized, x = input_81_cast_fp16)[name = tensor("obj_103_cast_fp16")]; tensor inputs_51_cast_fp16 = add(x = inputs_49_cast_fp16, y = obj_103_cast_fp16)[name = tensor("inputs_51_cast_fp16")]; tensor var_1995 = const()[name = tensor("op_1995"), val = tensor([1])]; tensor channels_mean_51_cast_fp16 = reduce_mean(axes = var_1995, keep_dims = var_1896, x = inputs_51_cast_fp16)[name = tensor("channels_mean_51_cast_fp16")]; tensor zero_mean_51_cast_fp16 = sub(x = inputs_51_cast_fp16, y = channels_mean_51_cast_fp16)[name = tensor("zero_mean_51_cast_fp16")]; tensor zero_mean_sq_51_cast_fp16 = mul(x = zero_mean_51_cast_fp16, y = zero_mean_51_cast_fp16)[name = tensor("zero_mean_sq_51_cast_fp16")]; tensor var_1999 = const()[name = tensor("op_1999"), val = tensor([1])]; tensor var_2000_cast_fp16 = reduce_mean(axes = var_1999, keep_dims = var_1896, x = zero_mean_sq_51_cast_fp16)[name = tensor("op_2000_cast_fp16")]; tensor var_2001_to_fp16 = const()[name = tensor("op_2001_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2002_cast_fp16 = add(x = var_2000_cast_fp16, y = var_2001_to_fp16)[name = tensor("op_2002_cast_fp16")]; tensor denom_51_epsilon_0 = const()[name = tensor("denom_51_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_51_cast_fp16 = rsqrt(epsilon = denom_51_epsilon_0, x = var_2002_cast_fp16)[name = tensor("denom_51_cast_fp16")]; tensor out_51_cast_fp16 = mul(x = zero_mean_51_cast_fp16, y = denom_51_cast_fp16)[name = tensor("out_51_cast_fp16")]; tensor obj_105_gamma_0_to_fp16 = const()[name = tensor("obj_105_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293489152)))]; tensor obj_105_beta_0_to_fp16 = const()[name = tensor("obj_105_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293491776)))]; tensor obj_105_epsilon_0_to_fp16 = const()[name = tensor("obj_105_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_105_cast_fp16 = batch_norm(beta = obj_105_beta_0_to_fp16, epsilon = obj_105_epsilon_0_to_fp16, gamma = obj_105_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_51_cast_fp16)[name = tensor("obj_105_cast_fp16")]; tensor var_2017 = const()[name = tensor("op_2017"), val = tensor([1, 1])]; tensor var_2019 = const()[name = tensor("op_2019"), val = tensor([1, 1])]; tensor query_35_pad_type_0 = const()[name = tensor("query_35_pad_type_0"), val = tensor("custom")]; tensor query_35_pad_0 = const()[name = tensor("query_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293494400))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294723264))), name = tensor("layers_8_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_8_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_8_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294723456)))]; tensor query_35_cast_fp16 = conv(bias = layers_8_encoder_attn_q_proj_bias_to_fp16, dilations = var_2019, groups = var_1895, pad = query_35_pad_0, pad_type = query_35_pad_type_0, strides = var_2017, weight = layers_8_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_105_cast_fp16)[name = tensor("query_35_cast_fp16")]; tensor var_2023 = const()[name = tensor("op_2023"), val = tensor([1, 1])]; tensor var_2025 = const()[name = tensor("op_2025"), val = tensor([1, 1])]; tensor key_35_pad_type_0 = const()[name = tensor("key_35_pad_type_0"), val = tensor("custom")]; tensor key_35_pad_0 = const()[name = tensor("key_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(294726080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295954944))), name = tensor("layers_8_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_35_cast_fp16 = conv(dilations = var_2025, groups = var_1895, pad = key_35_pad_0, pad_type = key_35_pad_type_0, strides = var_2023, weight = layers_8_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_35_cast_fp16")]; tensor var_2030 = const()[name = tensor("op_2030"), val = tensor([1, 1])]; tensor var_2032 = const()[name = tensor("op_2032"), val = tensor([1, 1])]; tensor value_35_pad_type_0 = const()[name = tensor("value_35_pad_type_0"), val = tensor("custom")]; tensor value_35_pad_0 = const()[name = tensor("value_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295955136))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297593600))), name = tensor("layers_8_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_8_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_8_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297594176)))]; tensor value_35_cast_fp16 = conv(bias = layers_8_encoder_attn_v_proj_bias_to_fp16, dilations = var_2032, groups = var_1895, pad = value_35_pad_0, pad_type = value_35_pad_type_0, strides = var_2030, weight = layers_8_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_35_cast_fp16")]; tensor var_2036 = const()[name = tensor("op_2036"), val = tensor([1, 20, 64, -1])]; tensor var_2037_cast_fp16 = reshape(shape = var_2036, x = query_35_cast_fp16)[name = tensor("op_2037_cast_fp16")]; tensor var_2038_to_fp16 = const()[name = tensor("op_2038_to_fp16"), val = tensor(0x1p-3)]; tensor var_2039_cast_fp16 = mul(x = var_2037_cast_fp16, y = var_2038_to_fp16)[name = tensor("op_2039_cast_fp16")]; tensor var_2040 = const()[name = tensor("op_2040"), val = tensor([1, 20, 64, -1])]; tensor var_2041_cast_fp16 = reshape(shape = var_2040, x = key_35_cast_fp16)[name = tensor("op_2041_cast_fp16")]; tensor mh_w_53_transpose_x_0 = const()[name = tensor("mh_w_53_transpose_x_0"), val = tensor(true)]; tensor mh_w_53_transpose_y_0 = const()[name = tensor("mh_w_53_transpose_y_0"), val = tensor(false)]; tensor mh_w_53_cast_fp16 = matmul(transpose_x = mh_w_53_transpose_x_0, transpose_y = mh_w_53_transpose_y_0, x = var_2039_cast_fp16, y = var_2041_cast_fp16)[name = tensor("mh_w_53_cast_fp16")]; tensor var_2044_cast_fp16 = softmax(axis = var_1888, x = mh_w_53_cast_fp16)[name = tensor("op_2044_cast_fp16")]; tensor var_2045 = const()[name = tensor("op_2045"), val = tensor([1, 20, 64, -1])]; tensor var_2046_cast_fp16 = reshape(shape = var_2045, x = value_35_cast_fp16)[name = tensor("op_2046_cast_fp16")]; tensor attn_35_transpose_x_0 = const()[name = tensor("attn_35_transpose_x_0"), val = tensor(false)]; tensor attn_35_transpose_y_0 = const()[name = tensor("attn_35_transpose_y_0"), val = tensor(true)]; tensor attn_35_cast_fp16 = matmul(transpose_x = attn_35_transpose_x_0, transpose_y = attn_35_transpose_y_0, x = var_2046_cast_fp16, y = var_2044_cast_fp16)[name = tensor("attn_35_cast_fp16")]; tensor var_2049 = const()[name = tensor("op_2049"), val = tensor([1, 1280, 1, -1])]; tensor input_83_cast_fp16 = reshape(shape = var_2049, x = attn_35_cast_fp16)[name = tensor("input_83_cast_fp16")]; tensor var_2053 = const()[name = tensor("op_2053"), val = tensor([1, 1])]; tensor var_2055 = const()[name = tensor("op_2055"), val = tensor([1, 1])]; tensor obj_107_pad_type_0 = const()[name = tensor("obj_107_pad_type_0"), val = tensor("custom")]; tensor obj_107_pad_0 = const()[name = tensor("obj_107_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(297596800))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(298825664))), name = tensor("layers_8_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_8_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_8_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(298825856)))]; tensor obj_107_cast_fp16 = conv(bias = layers_8_encoder_attn_o_proj_bias_to_fp16, dilations = var_2055, groups = var_1895, pad = obj_107_pad_0, pad_type = obj_107_pad_type_0, strides = var_2053, weight = layers_8_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_83_cast_fp16)[name = tensor("obj_107_cast_fp16")]; tensor inputs_53_cast_fp16 = add(x = inputs_51_cast_fp16, y = obj_107_cast_fp16)[name = tensor("inputs_53_cast_fp16")]; tensor var_2061 = const()[name = tensor("op_2061"), val = tensor([1])]; tensor channels_mean_53_cast_fp16 = reduce_mean(axes = var_2061, keep_dims = var_1896, x = inputs_53_cast_fp16)[name = tensor("channels_mean_53_cast_fp16")]; tensor zero_mean_53_cast_fp16 = sub(x = inputs_53_cast_fp16, y = channels_mean_53_cast_fp16)[name = tensor("zero_mean_53_cast_fp16")]; tensor zero_mean_sq_53_cast_fp16 = mul(x = zero_mean_53_cast_fp16, y = zero_mean_53_cast_fp16)[name = tensor("zero_mean_sq_53_cast_fp16")]; tensor var_2065 = const()[name = tensor("op_2065"), val = tensor([1])]; tensor var_2066_cast_fp16 = reduce_mean(axes = var_2065, keep_dims = var_1896, x = zero_mean_sq_53_cast_fp16)[name = tensor("op_2066_cast_fp16")]; tensor var_2067_to_fp16 = const()[name = tensor("op_2067_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2068_cast_fp16 = add(x = var_2066_cast_fp16, y = var_2067_to_fp16)[name = tensor("op_2068_cast_fp16")]; tensor denom_53_epsilon_0 = const()[name = tensor("denom_53_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_53_cast_fp16 = rsqrt(epsilon = denom_53_epsilon_0, x = var_2068_cast_fp16)[name = tensor("denom_53_cast_fp16")]; tensor out_53_cast_fp16 = mul(x = zero_mean_53_cast_fp16, y = denom_53_cast_fp16)[name = tensor("out_53_cast_fp16")]; tensor input_85_gamma_0_to_fp16 = const()[name = tensor("input_85_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(298828480)))]; tensor input_85_beta_0_to_fp16 = const()[name = tensor("input_85_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(298831104)))]; tensor input_85_epsilon_0_to_fp16 = const()[name = tensor("input_85_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_85_cast_fp16 = batch_norm(beta = input_85_beta_0_to_fp16, epsilon = input_85_epsilon_0_to_fp16, gamma = input_85_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_53_cast_fp16)[name = tensor("input_85_cast_fp16")]; tensor var_2079 = const()[name = tensor("op_2079"), val = tensor([1, 1])]; tensor var_2081 = const()[name = tensor("op_2081"), val = tensor([1, 1])]; tensor input_87_pad_type_0 = const()[name = tensor("input_87_pad_type_0"), val = tensor("custom")]; tensor input_87_pad_0 = const()[name = tensor("input_87_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(298833728))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303748992))), name = tensor("layers_8_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_8_fc1_bias_to_fp16 = const()[name = tensor("layers_8_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303749184)))]; tensor input_87_cast_fp16 = conv(bias = layers_8_fc1_bias_to_fp16, dilations = var_2081, groups = var_1895, pad = input_87_pad_0, pad_type = input_87_pad_type_0, strides = var_2079, weight = layers_8_fc1_weight_to_fp16_palettized, x = input_85_cast_fp16)[name = tensor("input_87_cast_fp16")]; tensor input_89_mode_0 = const()[name = tensor("input_89_mode_0"), val = tensor("EXACT")]; tensor input_89_cast_fp16 = gelu(mode = input_89_mode_0, x = input_87_cast_fp16)[name = tensor("input_89_cast_fp16")]; tensor var_2087 = const()[name = tensor("op_2087"), val = tensor([1, 1])]; tensor var_2089 = const()[name = tensor("op_2089"), val = tensor([1, 1])]; tensor hidden_states_19_pad_type_0 = const()[name = tensor("hidden_states_19_pad_type_0"), val = tensor("custom")]; tensor hidden_states_19_pad_0 = const()[name = tensor("hidden_states_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_8_fc2_weight_to_fp16 = const()[name = tensor("layers_8_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303759488)))]; tensor layers_8_fc2_bias_to_fp16 = const()[name = tensor("layers_8_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316866752)))]; tensor hidden_states_19_cast_fp16 = conv(bias = layers_8_fc2_bias_to_fp16, dilations = var_2089, groups = var_1895, pad = hidden_states_19_pad_0, pad_type = hidden_states_19_pad_type_0, strides = var_2087, weight = layers_8_fc2_weight_to_fp16, x = input_89_cast_fp16)[name = tensor("hidden_states_19_cast_fp16")]; tensor inputs_55_cast_fp16 = add(x = inputs_53_cast_fp16, y = hidden_states_19_cast_fp16)[name = tensor("inputs_55_cast_fp16")]; tensor var_2102 = const()[name = tensor("op_2102"), val = tensor(3)]; tensor var_2109 = const()[name = tensor("op_2109"), val = tensor(1)]; tensor var_2110 = const()[name = tensor("op_2110"), val = tensor(true)]; tensor var_2122 = const()[name = tensor("op_2122"), val = tensor([1])]; tensor channels_mean_55_cast_fp16 = reduce_mean(axes = var_2122, keep_dims = var_2110, x = inputs_55_cast_fp16)[name = tensor("channels_mean_55_cast_fp16")]; tensor zero_mean_55_cast_fp16 = sub(x = inputs_55_cast_fp16, y = channels_mean_55_cast_fp16)[name = tensor("zero_mean_55_cast_fp16")]; tensor zero_mean_sq_55_cast_fp16 = mul(x = zero_mean_55_cast_fp16, y = zero_mean_55_cast_fp16)[name = tensor("zero_mean_sq_55_cast_fp16")]; tensor var_2126 = const()[name = tensor("op_2126"), val = tensor([1])]; tensor var_2127_cast_fp16 = reduce_mean(axes = var_2126, keep_dims = var_2110, x = zero_mean_sq_55_cast_fp16)[name = tensor("op_2127_cast_fp16")]; tensor var_2128_to_fp16 = const()[name = tensor("op_2128_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2129_cast_fp16 = add(x = var_2127_cast_fp16, y = var_2128_to_fp16)[name = tensor("op_2129_cast_fp16")]; tensor denom_55_epsilon_0 = const()[name = tensor("denom_55_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_55_cast_fp16 = rsqrt(epsilon = denom_55_epsilon_0, x = var_2129_cast_fp16)[name = tensor("denom_55_cast_fp16")]; tensor out_55_cast_fp16 = mul(x = zero_mean_55_cast_fp16, y = denom_55_cast_fp16)[name = tensor("out_55_cast_fp16")]; tensor obj_109_gamma_0_to_fp16 = const()[name = tensor("obj_109_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316869376)))]; tensor obj_109_beta_0_to_fp16 = const()[name = tensor("obj_109_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316872000)))]; tensor obj_109_epsilon_0_to_fp16 = const()[name = tensor("obj_109_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_109_cast_fp16 = batch_norm(beta = obj_109_beta_0_to_fp16, epsilon = obj_109_epsilon_0_to_fp16, gamma = obj_109_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_55_cast_fp16)[name = tensor("obj_109_cast_fp16")]; tensor var_2144 = const()[name = tensor("op_2144"), val = tensor([1, 1])]; tensor var_2146 = const()[name = tensor("op_2146"), val = tensor([1, 1])]; tensor query_37_pad_type_0 = const()[name = tensor("query_37_pad_type_0"), val = tensor("custom")]; tensor query_37_pad_0 = const()[name = tensor("query_37_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316874624))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(318103488))), name = tensor("layers_9_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_9_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_9_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(318103680)))]; tensor query_37_cast_fp16 = conv(bias = layers_9_self_attn_q_proj_bias_to_fp16, dilations = var_2146, groups = var_2109, pad = query_37_pad_0, pad_type = query_37_pad_type_0, strides = var_2144, weight = layers_9_self_attn_q_proj_weight_to_fp16_palettized, x = obj_109_cast_fp16)[name = tensor("query_37_cast_fp16")]; tensor var_2150 = const()[name = tensor("op_2150"), val = tensor([1, 1])]; tensor var_2152 = const()[name = tensor("op_2152"), val = tensor([1, 1])]; tensor current_key_19_pad_type_0 = const()[name = tensor("current_key_19_pad_type_0"), val = tensor("custom")]; tensor current_key_19_pad_0 = const()[name = tensor("current_key_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(318106304))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(318925568))), name = tensor("layers_9_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_19_cast_fp16 = conv(dilations = var_2152, groups = var_2109, pad = current_key_19_pad_0, pad_type = current_key_19_pad_type_0, strides = var_2150, weight = layers_9_self_attn_k_proj_weight_to_fp16_palettized, x = obj_109_cast_fp16)[name = tensor("current_key_19_cast_fp16")]; tensor var_2157 = const()[name = tensor("op_2157"), val = tensor([1, 1])]; tensor var_2159 = const()[name = tensor("op_2159"), val = tensor([1, 1])]; tensor current_value_19_pad_type_0 = const()[name = tensor("current_value_19_pad_type_0"), val = tensor("custom")]; tensor current_value_19_pad_0 = const()[name = tensor("current_value_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(318925696))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319744960))), name = tensor("layers_9_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_9_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_9_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319745088)))]; tensor current_value_19_cast_fp16 = conv(bias = layers_9_self_attn_v_proj_bias_to_fp16, dilations = var_2159, groups = var_2109, pad = current_value_19_pad_0, pad_type = current_value_19_pad_type_0, strides = var_2157, weight = layers_9_self_attn_v_proj_weight_to_fp16_palettized, x = obj_109_cast_fp16)[name = tensor("current_value_19_cast_fp16")]; tensor var_2166_cast_fp16 = mul(x = current_key_19_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_2166_cast_fp16")]; tensor var_2168_cast_fp16 = mul(x = var_103_cast_fp16_9, y = var_241_cast_fp16)[name = tensor("op_2168_cast_fp16")]; tensor key_37_cast_fp16 = add(x = var_2166_cast_fp16, y = var_2168_cast_fp16)[name = tensor("key_37_cast_fp16")]; tensor var_2170_cast_fp16 = mul(x = current_value_19_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_2170_cast_fp16")]; tensor var_2172_cast_fp16 = mul(x = var_138_cast_fp16_9, y = var_241_cast_fp16)[name = tensor("op_2172_cast_fp16")]; tensor value_37_cast_fp16 = add(x = var_2170_cast_fp16, y = var_2172_cast_fp16)[name = tensor("value_37_cast_fp16")]; tensor var_2175 = const()[name = tensor("op_2175"), val = tensor([1, 20, 64, -1])]; tensor var_2176_cast_fp16 = reshape(shape = var_2175, x = query_37_cast_fp16)[name = tensor("op_2176_cast_fp16")]; tensor var_2177_to_fp16 = const()[name = tensor("op_2177_to_fp16"), val = tensor(0x1p-3)]; tensor var_2178_cast_fp16 = mul(x = var_2176_cast_fp16, y = var_2177_to_fp16)[name = tensor("op_2178_cast_fp16")]; tensor var_2179 = const()[name = tensor("op_2179"), val = tensor([1, 20, 64, -1])]; tensor var_2180_cast_fp16 = reshape(shape = var_2179, x = key_37_cast_fp16)[name = tensor("op_2180_cast_fp16")]; tensor mh_w_55_transpose_x_0 = const()[name = tensor("mh_w_55_transpose_x_0"), val = tensor(true)]; tensor mh_w_55_transpose_y_0 = const()[name = tensor("mh_w_55_transpose_y_0"), val = tensor(false)]; tensor mh_w_55_cast_fp16 = matmul(transpose_x = mh_w_55_transpose_x_0, transpose_y = mh_w_55_transpose_y_0, x = var_2178_cast_fp16, y = var_2180_cast_fp16)[name = tensor("mh_w_55_cast_fp16")]; tensor mh_w_57_cast_fp16 = add(x = mh_w_55_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_57_cast_fp16")]; tensor var_2188_cast_fp16 = softmax(axis = var_2102, x = mh_w_57_cast_fp16)[name = tensor("op_2188_cast_fp16")]; tensor var_2189 = const()[name = tensor("op_2189"), val = tensor([1, 20, 64, -1])]; tensor var_2190_cast_fp16 = reshape(shape = var_2189, x = value_37_cast_fp16)[name = tensor("op_2190_cast_fp16")]; tensor attn_37_transpose_x_0 = const()[name = tensor("attn_37_transpose_x_0"), val = tensor(false)]; tensor attn_37_transpose_y_0 = const()[name = tensor("attn_37_transpose_y_0"), val = tensor(true)]; tensor attn_37_cast_fp16 = matmul(transpose_x = attn_37_transpose_x_0, transpose_y = attn_37_transpose_y_0, x = var_2190_cast_fp16, y = var_2188_cast_fp16)[name = tensor("attn_37_cast_fp16")]; tensor var_2193 = const()[name = tensor("op_2193"), val = tensor([1, 1280, 1, -1])]; tensor input_91_cast_fp16 = reshape(shape = var_2193, x = attn_37_cast_fp16)[name = tensor("input_91_cast_fp16")]; tensor var_2197 = const()[name = tensor("op_2197"), val = tensor([1, 1])]; tensor var_2199 = const()[name = tensor("op_2199"), val = tensor([1, 1])]; tensor obj_115_pad_type_0 = const()[name = tensor("obj_115_pad_type_0"), val = tensor("custom")]; tensor obj_115_pad_0 = const()[name = tensor("obj_115_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(319747712))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320976576))), name = tensor("layers_9_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_9_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_9_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320976768)))]; tensor obj_115_cast_fp16 = conv(bias = layers_9_self_attn_o_proj_bias_to_fp16, dilations = var_2199, groups = var_2109, pad = obj_115_pad_0, pad_type = obj_115_pad_type_0, strides = var_2197, weight = layers_9_self_attn_o_proj_weight_to_fp16_palettized, x = input_91_cast_fp16)[name = tensor("obj_115_cast_fp16")]; tensor inputs_57_cast_fp16 = add(x = inputs_55_cast_fp16, y = obj_115_cast_fp16)[name = tensor("inputs_57_cast_fp16")]; tensor var_2209 = const()[name = tensor("op_2209"), val = tensor([1])]; tensor channels_mean_57_cast_fp16 = reduce_mean(axes = var_2209, keep_dims = var_2110, x = inputs_57_cast_fp16)[name = tensor("channels_mean_57_cast_fp16")]; tensor zero_mean_57_cast_fp16 = sub(x = inputs_57_cast_fp16, y = channels_mean_57_cast_fp16)[name = tensor("zero_mean_57_cast_fp16")]; tensor zero_mean_sq_57_cast_fp16 = mul(x = zero_mean_57_cast_fp16, y = zero_mean_57_cast_fp16)[name = tensor("zero_mean_sq_57_cast_fp16")]; tensor var_2213 = const()[name = tensor("op_2213"), val = tensor([1])]; tensor var_2214_cast_fp16 = reduce_mean(axes = var_2213, keep_dims = var_2110, x = zero_mean_sq_57_cast_fp16)[name = tensor("op_2214_cast_fp16")]; tensor var_2215_to_fp16 = const()[name = tensor("op_2215_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2216_cast_fp16 = add(x = var_2214_cast_fp16, y = var_2215_to_fp16)[name = tensor("op_2216_cast_fp16")]; tensor denom_57_epsilon_0 = const()[name = tensor("denom_57_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_57_cast_fp16 = rsqrt(epsilon = denom_57_epsilon_0, x = var_2216_cast_fp16)[name = tensor("denom_57_cast_fp16")]; tensor out_57_cast_fp16 = mul(x = zero_mean_57_cast_fp16, y = denom_57_cast_fp16)[name = tensor("out_57_cast_fp16")]; tensor obj_117_gamma_0_to_fp16 = const()[name = tensor("obj_117_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320979392)))]; tensor obj_117_beta_0_to_fp16 = const()[name = tensor("obj_117_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320982016)))]; tensor obj_117_epsilon_0_to_fp16 = const()[name = tensor("obj_117_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_117_cast_fp16 = batch_norm(beta = obj_117_beta_0_to_fp16, epsilon = obj_117_epsilon_0_to_fp16, gamma = obj_117_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_57_cast_fp16)[name = tensor("obj_117_cast_fp16")]; tensor var_2231 = const()[name = tensor("op_2231"), val = tensor([1, 1])]; tensor var_2233 = const()[name = tensor("op_2233"), val = tensor([1, 1])]; tensor query_39_pad_type_0 = const()[name = tensor("query_39_pad_type_0"), val = tensor("custom")]; tensor query_39_pad_0 = const()[name = tensor("query_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320984640))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(321803904))), name = tensor("layers_9_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_9_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_9_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(321804032)))]; tensor query_39_cast_fp16 = conv(bias = layers_9_encoder_attn_q_proj_bias_to_fp16, dilations = var_2233, groups = var_2109, pad = query_39_pad_0, pad_type = query_39_pad_type_0, strides = var_2231, weight = layers_9_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_117_cast_fp16)[name = tensor("query_39_cast_fp16")]; tensor var_2237 = const()[name = tensor("op_2237"), val = tensor([1, 1])]; tensor var_2239 = const()[name = tensor("op_2239"), val = tensor([1, 1])]; tensor key_39_pad_type_0 = const()[name = tensor("key_39_pad_type_0"), val = tensor("custom")]; tensor key_39_pad_0 = const()[name = tensor("key_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(321806656))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322625920))), name = tensor("layers_9_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_39_cast_fp16 = conv(dilations = var_2239, groups = var_2109, pad = key_39_pad_0, pad_type = key_39_pad_type_0, strides = var_2237, weight = layers_9_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_39_cast_fp16")]; tensor var_2244 = const()[name = tensor("op_2244"), val = tensor([1, 1])]; tensor var_2246 = const()[name = tensor("op_2246"), val = tensor([1, 1])]; tensor value_39_pad_type_0 = const()[name = tensor("value_39_pad_type_0"), val = tensor("custom")]; tensor value_39_pad_0 = const()[name = tensor("value_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(322626048))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(323445312))), name = tensor("layers_9_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_9_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_9_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(323445440)))]; tensor value_39_cast_fp16 = conv(bias = layers_9_encoder_attn_v_proj_bias_to_fp16, dilations = var_2246, groups = var_2109, pad = value_39_pad_0, pad_type = value_39_pad_type_0, strides = var_2244, weight = layers_9_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_39_cast_fp16")]; tensor var_2250 = const()[name = tensor("op_2250"), val = tensor([1, 20, 64, -1])]; tensor var_2251_cast_fp16 = reshape(shape = var_2250, x = query_39_cast_fp16)[name = tensor("op_2251_cast_fp16")]; tensor var_2252_to_fp16 = const()[name = tensor("op_2252_to_fp16"), val = tensor(0x1p-3)]; tensor var_2253_cast_fp16 = mul(x = var_2251_cast_fp16, y = var_2252_to_fp16)[name = tensor("op_2253_cast_fp16")]; tensor var_2254 = const()[name = tensor("op_2254"), val = tensor([1, 20, 64, -1])]; tensor var_2255_cast_fp16 = reshape(shape = var_2254, x = key_39_cast_fp16)[name = tensor("op_2255_cast_fp16")]; tensor mh_w_59_transpose_x_0 = const()[name = tensor("mh_w_59_transpose_x_0"), val = tensor(true)]; tensor mh_w_59_transpose_y_0 = const()[name = tensor("mh_w_59_transpose_y_0"), val = tensor(false)]; tensor mh_w_59_cast_fp16 = matmul(transpose_x = mh_w_59_transpose_x_0, transpose_y = mh_w_59_transpose_y_0, x = var_2253_cast_fp16, y = var_2255_cast_fp16)[name = tensor("mh_w_59_cast_fp16")]; tensor var_2258_cast_fp16 = softmax(axis = var_2102, x = mh_w_59_cast_fp16)[name = tensor("op_2258_cast_fp16")]; tensor var_2259 = const()[name = tensor("op_2259"), val = tensor([1, 20, 64, -1])]; tensor var_2260_cast_fp16 = reshape(shape = var_2259, x = value_39_cast_fp16)[name = tensor("op_2260_cast_fp16")]; tensor attn_39_transpose_x_0 = const()[name = tensor("attn_39_transpose_x_0"), val = tensor(false)]; tensor attn_39_transpose_y_0 = const()[name = tensor("attn_39_transpose_y_0"), val = tensor(true)]; tensor attn_39_cast_fp16 = matmul(transpose_x = attn_39_transpose_x_0, transpose_y = attn_39_transpose_y_0, x = var_2260_cast_fp16, y = var_2258_cast_fp16)[name = tensor("attn_39_cast_fp16")]; tensor var_2263 = const()[name = tensor("op_2263"), val = tensor([1, 1280, 1, -1])]; tensor input_93_cast_fp16 = reshape(shape = var_2263, x = attn_39_cast_fp16)[name = tensor("input_93_cast_fp16")]; tensor var_2267 = const()[name = tensor("op_2267"), val = tensor([1, 1])]; tensor var_2269 = const()[name = tensor("op_2269"), val = tensor([1, 1])]; tensor obj_119_pad_type_0 = const()[name = tensor("obj_119_pad_type_0"), val = tensor("custom")]; tensor obj_119_pad_0 = const()[name = tensor("obj_119_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(323448064))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(324676928))), name = tensor("layers_9_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_9_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_9_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(324677120)))]; tensor obj_119_cast_fp16 = conv(bias = layers_9_encoder_attn_o_proj_bias_to_fp16, dilations = var_2269, groups = var_2109, pad = obj_119_pad_0, pad_type = obj_119_pad_type_0, strides = var_2267, weight = layers_9_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_93_cast_fp16)[name = tensor("obj_119_cast_fp16")]; tensor inputs_59_cast_fp16 = add(x = inputs_57_cast_fp16, y = obj_119_cast_fp16)[name = tensor("inputs_59_cast_fp16")]; tensor var_2275 = const()[name = tensor("op_2275"), val = tensor([1])]; tensor channels_mean_59_cast_fp16 = reduce_mean(axes = var_2275, keep_dims = var_2110, x = inputs_59_cast_fp16)[name = tensor("channels_mean_59_cast_fp16")]; tensor zero_mean_59_cast_fp16 = sub(x = inputs_59_cast_fp16, y = channels_mean_59_cast_fp16)[name = tensor("zero_mean_59_cast_fp16")]; tensor zero_mean_sq_59_cast_fp16 = mul(x = zero_mean_59_cast_fp16, y = zero_mean_59_cast_fp16)[name = tensor("zero_mean_sq_59_cast_fp16")]; tensor var_2279 = const()[name = tensor("op_2279"), val = tensor([1])]; tensor var_2280_cast_fp16 = reduce_mean(axes = var_2279, keep_dims = var_2110, x = zero_mean_sq_59_cast_fp16)[name = tensor("op_2280_cast_fp16")]; tensor var_2281_to_fp16 = const()[name = tensor("op_2281_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2282_cast_fp16 = add(x = var_2280_cast_fp16, y = var_2281_to_fp16)[name = tensor("op_2282_cast_fp16")]; tensor denom_59_epsilon_0 = const()[name = tensor("denom_59_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_59_cast_fp16 = rsqrt(epsilon = denom_59_epsilon_0, x = var_2282_cast_fp16)[name = tensor("denom_59_cast_fp16")]; tensor out_59_cast_fp16 = mul(x = zero_mean_59_cast_fp16, y = denom_59_cast_fp16)[name = tensor("out_59_cast_fp16")]; tensor input_95_gamma_0_to_fp16 = const()[name = tensor("input_95_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(324679744)))]; tensor input_95_beta_0_to_fp16 = const()[name = tensor("input_95_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(324682368)))]; tensor input_95_epsilon_0_to_fp16 = const()[name = tensor("input_95_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_95_cast_fp16 = batch_norm(beta = input_95_beta_0_to_fp16, epsilon = input_95_epsilon_0_to_fp16, gamma = input_95_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_59_cast_fp16)[name = tensor("input_95_cast_fp16")]; tensor var_2293 = const()[name = tensor("op_2293"), val = tensor([1, 1])]; tensor var_2295 = const()[name = tensor("op_2295"), val = tensor([1, 1])]; tensor input_97_pad_type_0 = const()[name = tensor("input_97_pad_type_0"), val = tensor("custom")]; tensor input_97_pad_0 = const()[name = tensor("input_97_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(324684992))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329600256))), name = tensor("layers_9_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_9_fc1_bias_to_fp16 = const()[name = tensor("layers_9_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329600448)))]; tensor input_97_cast_fp16 = conv(bias = layers_9_fc1_bias_to_fp16, dilations = var_2295, groups = var_2109, pad = input_97_pad_0, pad_type = input_97_pad_type_0, strides = var_2293, weight = layers_9_fc1_weight_to_fp16_palettized, x = input_95_cast_fp16)[name = tensor("input_97_cast_fp16")]; tensor input_99_mode_0 = const()[name = tensor("input_99_mode_0"), val = tensor("EXACT")]; tensor input_99_cast_fp16 = gelu(mode = input_99_mode_0, x = input_97_cast_fp16)[name = tensor("input_99_cast_fp16")]; tensor var_2301 = const()[name = tensor("op_2301"), val = tensor([1, 1])]; tensor var_2303 = const()[name = tensor("op_2303"), val = tensor([1, 1])]; tensor hidden_states_21_pad_type_0 = const()[name = tensor("hidden_states_21_pad_type_0"), val = tensor("custom")]; tensor hidden_states_21_pad_0 = const()[name = tensor("hidden_states_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_9_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(329610752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(336164416))), name = tensor("layers_9_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_9_fc2_bias_to_fp16 = const()[name = tensor("layers_9_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(336164992)))]; tensor hidden_states_21_cast_fp16 = conv(bias = layers_9_fc2_bias_to_fp16, dilations = var_2303, groups = var_2109, pad = hidden_states_21_pad_0, pad_type = hidden_states_21_pad_type_0, strides = var_2301, weight = layers_9_fc2_weight_to_fp16_palettized, x = input_99_cast_fp16)[name = tensor("hidden_states_21_cast_fp16")]; tensor inputs_61_cast_fp16 = add(x = inputs_59_cast_fp16, y = hidden_states_21_cast_fp16)[name = tensor("inputs_61_cast_fp16")]; tensor var_2316 = const()[name = tensor("op_2316"), val = tensor(3)]; tensor var_2323 = const()[name = tensor("op_2323"), val = tensor(1)]; tensor var_2324 = const()[name = tensor("op_2324"), val = tensor(true)]; tensor var_2336 = const()[name = tensor("op_2336"), val = tensor([1])]; tensor channels_mean_61_cast_fp16 = reduce_mean(axes = var_2336, keep_dims = var_2324, x = inputs_61_cast_fp16)[name = tensor("channels_mean_61_cast_fp16")]; tensor zero_mean_61_cast_fp16 = sub(x = inputs_61_cast_fp16, y = channels_mean_61_cast_fp16)[name = tensor("zero_mean_61_cast_fp16")]; tensor zero_mean_sq_61_cast_fp16 = mul(x = zero_mean_61_cast_fp16, y = zero_mean_61_cast_fp16)[name = tensor("zero_mean_sq_61_cast_fp16")]; tensor var_2340 = const()[name = tensor("op_2340"), val = tensor([1])]; tensor var_2341_cast_fp16 = reduce_mean(axes = var_2340, keep_dims = var_2324, x = zero_mean_sq_61_cast_fp16)[name = tensor("op_2341_cast_fp16")]; tensor var_2342_to_fp16 = const()[name = tensor("op_2342_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2343_cast_fp16 = add(x = var_2341_cast_fp16, y = var_2342_to_fp16)[name = tensor("op_2343_cast_fp16")]; tensor denom_61_epsilon_0 = const()[name = tensor("denom_61_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_61_cast_fp16 = rsqrt(epsilon = denom_61_epsilon_0, x = var_2343_cast_fp16)[name = tensor("denom_61_cast_fp16")]; tensor out_61_cast_fp16 = mul(x = zero_mean_61_cast_fp16, y = denom_61_cast_fp16)[name = tensor("out_61_cast_fp16")]; tensor obj_121_gamma_0_to_fp16 = const()[name = tensor("obj_121_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(336167616)))]; tensor obj_121_beta_0_to_fp16 = const()[name = tensor("obj_121_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(336170240)))]; tensor obj_121_epsilon_0_to_fp16 = const()[name = tensor("obj_121_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_121_cast_fp16 = batch_norm(beta = obj_121_beta_0_to_fp16, epsilon = obj_121_epsilon_0_to_fp16, gamma = obj_121_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_61_cast_fp16)[name = tensor("obj_121_cast_fp16")]; tensor var_2358 = const()[name = tensor("op_2358"), val = tensor([1, 1])]; tensor var_2360 = const()[name = tensor("op_2360"), val = tensor([1, 1])]; tensor query_41_pad_type_0 = const()[name = tensor("query_41_pad_type_0"), val = tensor("custom")]; tensor query_41_pad_0 = const()[name = tensor("query_41_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(336172864))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337401728))), name = tensor("layers_10_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_10_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_10_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337401920)))]; tensor query_41_cast_fp16 = conv(bias = layers_10_self_attn_q_proj_bias_to_fp16, dilations = var_2360, groups = var_2323, pad = query_41_pad_0, pad_type = query_41_pad_type_0, strides = var_2358, weight = layers_10_self_attn_q_proj_weight_to_fp16_palettized, x = obj_121_cast_fp16)[name = tensor("query_41_cast_fp16")]; tensor var_2364 = const()[name = tensor("op_2364"), val = tensor([1, 1])]; tensor var_2366 = const()[name = tensor("op_2366"), val = tensor([1, 1])]; tensor current_key_21_pad_type_0 = const()[name = tensor("current_key_21_pad_type_0"), val = tensor("custom")]; tensor current_key_21_pad_0 = const()[name = tensor("current_key_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337404544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339043008))), name = tensor("layers_10_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_21_cast_fp16 = conv(dilations = var_2366, groups = var_2323, pad = current_key_21_pad_0, pad_type = current_key_21_pad_type_0, strides = var_2364, weight = layers_10_self_attn_k_proj_weight_to_fp16_palettized, x = obj_121_cast_fp16)[name = tensor("current_key_21_cast_fp16")]; tensor var_2371 = const()[name = tensor("op_2371"), val = tensor([1, 1])]; tensor var_2373 = const()[name = tensor("op_2373"), val = tensor([1, 1])]; tensor current_value_21_pad_type_0 = const()[name = tensor("current_value_21_pad_type_0"), val = tensor("custom")]; tensor current_value_21_pad_0 = const()[name = tensor("current_value_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339043584))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(340272448))), name = tensor("layers_10_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_10_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_10_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(340272640)))]; tensor current_value_21_cast_fp16 = conv(bias = layers_10_self_attn_v_proj_bias_to_fp16, dilations = var_2373, groups = var_2323, pad = current_value_21_pad_0, pad_type = current_value_21_pad_type_0, strides = var_2371, weight = layers_10_self_attn_v_proj_weight_to_fp16_palettized, x = obj_121_cast_fp16)[name = tensor("current_value_21_cast_fp16")]; tensor var_2380_cast_fp16 = mul(x = current_key_21_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_2380_cast_fp16")]; tensor var_2382_cast_fp16 = mul(x = var_103_cast_fp16_10, y = var_241_cast_fp16)[name = tensor("op_2382_cast_fp16")]; tensor key_41_cast_fp16 = add(x = var_2380_cast_fp16, y = var_2382_cast_fp16)[name = tensor("key_41_cast_fp16")]; tensor var_2384_cast_fp16 = mul(x = current_value_21_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_2384_cast_fp16")]; tensor var_2386_cast_fp16 = mul(x = var_138_cast_fp16_10, y = var_241_cast_fp16)[name = tensor("op_2386_cast_fp16")]; tensor value_41_cast_fp16 = add(x = var_2384_cast_fp16, y = var_2386_cast_fp16)[name = tensor("value_41_cast_fp16")]; tensor var_2389 = const()[name = tensor("op_2389"), val = tensor([1, 20, 64, -1])]; tensor var_2390_cast_fp16 = reshape(shape = var_2389, x = query_41_cast_fp16)[name = tensor("op_2390_cast_fp16")]; tensor var_2391_to_fp16 = const()[name = tensor("op_2391_to_fp16"), val = tensor(0x1p-3)]; tensor var_2392_cast_fp16 = mul(x = var_2390_cast_fp16, y = var_2391_to_fp16)[name = tensor("op_2392_cast_fp16")]; tensor var_2393 = const()[name = tensor("op_2393"), val = tensor([1, 20, 64, -1])]; tensor var_2394_cast_fp16 = reshape(shape = var_2393, x = key_41_cast_fp16)[name = tensor("op_2394_cast_fp16")]; tensor mh_w_61_transpose_x_0 = const()[name = tensor("mh_w_61_transpose_x_0"), val = tensor(true)]; tensor mh_w_61_transpose_y_0 = const()[name = tensor("mh_w_61_transpose_y_0"), val = tensor(false)]; tensor mh_w_61_cast_fp16 = matmul(transpose_x = mh_w_61_transpose_x_0, transpose_y = mh_w_61_transpose_y_0, x = var_2392_cast_fp16, y = var_2394_cast_fp16)[name = tensor("mh_w_61_cast_fp16")]; tensor mh_w_63_cast_fp16 = add(x = mh_w_61_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_63_cast_fp16")]; tensor var_2402_cast_fp16 = softmax(axis = var_2316, x = mh_w_63_cast_fp16)[name = tensor("op_2402_cast_fp16")]; tensor var_2403 = const()[name = tensor("op_2403"), val = tensor([1, 20, 64, -1])]; tensor var_2404_cast_fp16 = reshape(shape = var_2403, x = value_41_cast_fp16)[name = tensor("op_2404_cast_fp16")]; tensor attn_41_transpose_x_0 = const()[name = tensor("attn_41_transpose_x_0"), val = tensor(false)]; tensor attn_41_transpose_y_0 = const()[name = tensor("attn_41_transpose_y_0"), val = tensor(true)]; tensor attn_41_cast_fp16 = matmul(transpose_x = attn_41_transpose_x_0, transpose_y = attn_41_transpose_y_0, x = var_2404_cast_fp16, y = var_2402_cast_fp16)[name = tensor("attn_41_cast_fp16")]; tensor var_2407 = const()[name = tensor("op_2407"), val = tensor([1, 1280, 1, -1])]; tensor input_101_cast_fp16 = reshape(shape = var_2407, x = attn_41_cast_fp16)[name = tensor("input_101_cast_fp16")]; tensor var_2411 = const()[name = tensor("op_2411"), val = tensor([1, 1])]; tensor var_2413 = const()[name = tensor("op_2413"), val = tensor([1, 1])]; tensor obj_127_pad_type_0 = const()[name = tensor("obj_127_pad_type_0"), val = tensor("custom")]; tensor obj_127_pad_0 = const()[name = tensor("obj_127_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(340275264))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341504128))), name = tensor("layers_10_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_10_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_10_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341504320)))]; tensor obj_127_cast_fp16 = conv(bias = layers_10_self_attn_o_proj_bias_to_fp16, dilations = var_2413, groups = var_2323, pad = obj_127_pad_0, pad_type = obj_127_pad_type_0, strides = var_2411, weight = layers_10_self_attn_o_proj_weight_to_fp16_palettized, x = input_101_cast_fp16)[name = tensor("obj_127_cast_fp16")]; tensor inputs_63_cast_fp16 = add(x = inputs_61_cast_fp16, y = obj_127_cast_fp16)[name = tensor("inputs_63_cast_fp16")]; tensor var_2423 = const()[name = tensor("op_2423"), val = tensor([1])]; tensor channels_mean_63_cast_fp16 = reduce_mean(axes = var_2423, keep_dims = var_2324, x = inputs_63_cast_fp16)[name = tensor("channels_mean_63_cast_fp16")]; tensor zero_mean_63_cast_fp16 = sub(x = inputs_63_cast_fp16, y = channels_mean_63_cast_fp16)[name = tensor("zero_mean_63_cast_fp16")]; tensor zero_mean_sq_63_cast_fp16 = mul(x = zero_mean_63_cast_fp16, y = zero_mean_63_cast_fp16)[name = tensor("zero_mean_sq_63_cast_fp16")]; tensor var_2427 = const()[name = tensor("op_2427"), val = tensor([1])]; tensor var_2428_cast_fp16 = reduce_mean(axes = var_2427, keep_dims = var_2324, x = zero_mean_sq_63_cast_fp16)[name = tensor("op_2428_cast_fp16")]; tensor var_2429_to_fp16 = const()[name = tensor("op_2429_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2430_cast_fp16 = add(x = var_2428_cast_fp16, y = var_2429_to_fp16)[name = tensor("op_2430_cast_fp16")]; tensor denom_63_epsilon_0 = const()[name = tensor("denom_63_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_63_cast_fp16 = rsqrt(epsilon = denom_63_epsilon_0, x = var_2430_cast_fp16)[name = tensor("denom_63_cast_fp16")]; tensor out_63_cast_fp16 = mul(x = zero_mean_63_cast_fp16, y = denom_63_cast_fp16)[name = tensor("out_63_cast_fp16")]; tensor obj_129_gamma_0_to_fp16 = const()[name = tensor("obj_129_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341506944)))]; tensor obj_129_beta_0_to_fp16 = const()[name = tensor("obj_129_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341509568)))]; tensor obj_129_epsilon_0_to_fp16 = const()[name = tensor("obj_129_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_129_cast_fp16 = batch_norm(beta = obj_129_beta_0_to_fp16, epsilon = obj_129_epsilon_0_to_fp16, gamma = obj_129_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_63_cast_fp16)[name = tensor("obj_129_cast_fp16")]; tensor var_2445 = const()[name = tensor("op_2445"), val = tensor([1, 1])]; tensor var_2447 = const()[name = tensor("op_2447"), val = tensor([1, 1])]; tensor query_43_pad_type_0 = const()[name = tensor("query_43_pad_type_0"), val = tensor("custom")]; tensor query_43_pad_0 = const()[name = tensor("query_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341512192))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342331456))), name = tensor("layers_10_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_10_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_10_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342331584)))]; tensor query_43_cast_fp16 = conv(bias = layers_10_encoder_attn_q_proj_bias_to_fp16, dilations = var_2447, groups = var_2323, pad = query_43_pad_0, pad_type = query_43_pad_type_0, strides = var_2445, weight = layers_10_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_129_cast_fp16)[name = tensor("query_43_cast_fp16")]; tensor var_2451 = const()[name = tensor("op_2451"), val = tensor([1, 1])]; tensor var_2453 = const()[name = tensor("op_2453"), val = tensor([1, 1])]; tensor key_43_pad_type_0 = const()[name = tensor("key_43_pad_type_0"), val = tensor("custom")]; tensor key_43_pad_0 = const()[name = tensor("key_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(342334208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343153472))), name = tensor("layers_10_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_43_cast_fp16 = conv(dilations = var_2453, groups = var_2323, pad = key_43_pad_0, pad_type = key_43_pad_type_0, strides = var_2451, weight = layers_10_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_43_cast_fp16")]; tensor var_2458 = const()[name = tensor("op_2458"), val = tensor([1, 1])]; tensor var_2460 = const()[name = tensor("op_2460"), val = tensor([1, 1])]; tensor value_43_pad_type_0 = const()[name = tensor("value_43_pad_type_0"), val = tensor("custom")]; tensor value_43_pad_0 = const()[name = tensor("value_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343153600))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343972864))), name = tensor("layers_10_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_10_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_10_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343972992)))]; tensor value_43_cast_fp16 = conv(bias = layers_10_encoder_attn_v_proj_bias_to_fp16, dilations = var_2460, groups = var_2323, pad = value_43_pad_0, pad_type = value_43_pad_type_0, strides = var_2458, weight = layers_10_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_43_cast_fp16")]; tensor var_2464 = const()[name = tensor("op_2464"), val = tensor([1, 20, 64, -1])]; tensor var_2465_cast_fp16 = reshape(shape = var_2464, x = query_43_cast_fp16)[name = tensor("op_2465_cast_fp16")]; tensor var_2466_to_fp16 = const()[name = tensor("op_2466_to_fp16"), val = tensor(0x1p-3)]; tensor var_2467_cast_fp16 = mul(x = var_2465_cast_fp16, y = var_2466_to_fp16)[name = tensor("op_2467_cast_fp16")]; tensor var_2468 = const()[name = tensor("op_2468"), val = tensor([1, 20, 64, -1])]; tensor var_2469_cast_fp16 = reshape(shape = var_2468, x = key_43_cast_fp16)[name = tensor("op_2469_cast_fp16")]; tensor mh_w_65_transpose_x_0 = const()[name = tensor("mh_w_65_transpose_x_0"), val = tensor(true)]; tensor mh_w_65_transpose_y_0 = const()[name = tensor("mh_w_65_transpose_y_0"), val = tensor(false)]; tensor mh_w_65_cast_fp16 = matmul(transpose_x = mh_w_65_transpose_x_0, transpose_y = mh_w_65_transpose_y_0, x = var_2467_cast_fp16, y = var_2469_cast_fp16)[name = tensor("mh_w_65_cast_fp16")]; tensor var_2472_cast_fp16 = softmax(axis = var_2316, x = mh_w_65_cast_fp16)[name = tensor("op_2472_cast_fp16")]; tensor var_2473 = const()[name = tensor("op_2473"), val = tensor([1, 20, 64, -1])]; tensor var_2474_cast_fp16 = reshape(shape = var_2473, x = value_43_cast_fp16)[name = tensor("op_2474_cast_fp16")]; tensor attn_43_transpose_x_0 = const()[name = tensor("attn_43_transpose_x_0"), val = tensor(false)]; tensor attn_43_transpose_y_0 = const()[name = tensor("attn_43_transpose_y_0"), val = tensor(true)]; tensor attn_43_cast_fp16 = matmul(transpose_x = attn_43_transpose_x_0, transpose_y = attn_43_transpose_y_0, x = var_2474_cast_fp16, y = var_2472_cast_fp16)[name = tensor("attn_43_cast_fp16")]; tensor var_2477 = const()[name = tensor("op_2477"), val = tensor([1, 1280, 1, -1])]; tensor input_103_cast_fp16 = reshape(shape = var_2477, x = attn_43_cast_fp16)[name = tensor("input_103_cast_fp16")]; tensor var_2481 = const()[name = tensor("op_2481"), val = tensor([1, 1])]; tensor var_2483 = const()[name = tensor("op_2483"), val = tensor([1, 1])]; tensor obj_131_pad_type_0 = const()[name = tensor("obj_131_pad_type_0"), val = tensor("custom")]; tensor obj_131_pad_0 = const()[name = tensor("obj_131_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343975616))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345204480))), name = tensor("layers_10_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_10_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_10_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345204672)))]; tensor obj_131_cast_fp16 = conv(bias = layers_10_encoder_attn_o_proj_bias_to_fp16, dilations = var_2483, groups = var_2323, pad = obj_131_pad_0, pad_type = obj_131_pad_type_0, strides = var_2481, weight = layers_10_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_103_cast_fp16)[name = tensor("obj_131_cast_fp16")]; tensor inputs_65_cast_fp16 = add(x = inputs_63_cast_fp16, y = obj_131_cast_fp16)[name = tensor("inputs_65_cast_fp16")]; tensor var_2489 = const()[name = tensor("op_2489"), val = tensor([1])]; tensor channels_mean_65_cast_fp16 = reduce_mean(axes = var_2489, keep_dims = var_2324, x = inputs_65_cast_fp16)[name = tensor("channels_mean_65_cast_fp16")]; tensor zero_mean_65_cast_fp16 = sub(x = inputs_65_cast_fp16, y = channels_mean_65_cast_fp16)[name = tensor("zero_mean_65_cast_fp16")]; tensor zero_mean_sq_65_cast_fp16 = mul(x = zero_mean_65_cast_fp16, y = zero_mean_65_cast_fp16)[name = tensor("zero_mean_sq_65_cast_fp16")]; tensor var_2493 = const()[name = tensor("op_2493"), val = tensor([1])]; tensor var_2494_cast_fp16 = reduce_mean(axes = var_2493, keep_dims = var_2324, x = zero_mean_sq_65_cast_fp16)[name = tensor("op_2494_cast_fp16")]; tensor var_2495_to_fp16 = const()[name = tensor("op_2495_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2496_cast_fp16 = add(x = var_2494_cast_fp16, y = var_2495_to_fp16)[name = tensor("op_2496_cast_fp16")]; tensor denom_65_epsilon_0 = const()[name = tensor("denom_65_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_65_cast_fp16 = rsqrt(epsilon = denom_65_epsilon_0, x = var_2496_cast_fp16)[name = tensor("denom_65_cast_fp16")]; tensor out_65_cast_fp16 = mul(x = zero_mean_65_cast_fp16, y = denom_65_cast_fp16)[name = tensor("out_65_cast_fp16")]; tensor input_105_gamma_0_to_fp16 = const()[name = tensor("input_105_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345207296)))]; tensor input_105_beta_0_to_fp16 = const()[name = tensor("input_105_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345209920)))]; tensor input_105_epsilon_0_to_fp16 = const()[name = tensor("input_105_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_105_cast_fp16 = batch_norm(beta = input_105_beta_0_to_fp16, epsilon = input_105_epsilon_0_to_fp16, gamma = input_105_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_65_cast_fp16)[name = tensor("input_105_cast_fp16")]; tensor var_2507 = const()[name = tensor("op_2507"), val = tensor([1, 1])]; tensor var_2509 = const()[name = tensor("op_2509"), val = tensor([1, 1])]; tensor input_107_pad_type_0 = const()[name = tensor("input_107_pad_type_0"), val = tensor("custom")]; tensor input_107_pad_0 = const()[name = tensor("input_107_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345212544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350127808))), name = tensor("layers_10_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_10_fc1_bias_to_fp16 = const()[name = tensor("layers_10_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350128000)))]; tensor input_107_cast_fp16 = conv(bias = layers_10_fc1_bias_to_fp16, dilations = var_2509, groups = var_2323, pad = input_107_pad_0, pad_type = input_107_pad_type_0, strides = var_2507, weight = layers_10_fc1_weight_to_fp16_palettized, x = input_105_cast_fp16)[name = tensor("input_107_cast_fp16")]; tensor input_109_mode_0 = const()[name = tensor("input_109_mode_0"), val = tensor("EXACT")]; tensor input_109_cast_fp16 = gelu(mode = input_109_mode_0, x = input_107_cast_fp16)[name = tensor("input_109_cast_fp16")]; tensor var_2515 = const()[name = tensor("op_2515"), val = tensor([1, 1])]; tensor var_2517 = const()[name = tensor("op_2517"), val = tensor([1, 1])]; tensor hidden_states_23_pad_type_0 = const()[name = tensor("hidden_states_23_pad_type_0"), val = tensor("custom")]; tensor hidden_states_23_pad_0 = const()[name = tensor("hidden_states_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_10_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350138304))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355053568))), name = tensor("layers_10_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_10_fc2_bias_to_fp16 = const()[name = tensor("layers_10_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355053760)))]; tensor hidden_states_23_cast_fp16 = conv(bias = layers_10_fc2_bias_to_fp16, dilations = var_2517, groups = var_2323, pad = hidden_states_23_pad_0, pad_type = hidden_states_23_pad_type_0, strides = var_2515, weight = layers_10_fc2_weight_to_fp16_palettized, x = input_109_cast_fp16)[name = tensor("hidden_states_23_cast_fp16")]; tensor inputs_67_cast_fp16 = add(x = inputs_65_cast_fp16, y = hidden_states_23_cast_fp16)[name = tensor("inputs_67_cast_fp16")]; tensor var_2530 = const()[name = tensor("op_2530"), val = tensor(3)]; tensor var_2537 = const()[name = tensor("op_2537"), val = tensor(1)]; tensor var_2538 = const()[name = tensor("op_2538"), val = tensor(true)]; tensor var_2550 = const()[name = tensor("op_2550"), val = tensor([1])]; tensor channels_mean_67_cast_fp16 = reduce_mean(axes = var_2550, keep_dims = var_2538, x = inputs_67_cast_fp16)[name = tensor("channels_mean_67_cast_fp16")]; tensor zero_mean_67_cast_fp16 = sub(x = inputs_67_cast_fp16, y = channels_mean_67_cast_fp16)[name = tensor("zero_mean_67_cast_fp16")]; tensor zero_mean_sq_67_cast_fp16 = mul(x = zero_mean_67_cast_fp16, y = zero_mean_67_cast_fp16)[name = tensor("zero_mean_sq_67_cast_fp16")]; tensor var_2554 = const()[name = tensor("op_2554"), val = tensor([1])]; tensor var_2555_cast_fp16 = reduce_mean(axes = var_2554, keep_dims = var_2538, x = zero_mean_sq_67_cast_fp16)[name = tensor("op_2555_cast_fp16")]; tensor var_2556_to_fp16 = const()[name = tensor("op_2556_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2557_cast_fp16 = add(x = var_2555_cast_fp16, y = var_2556_to_fp16)[name = tensor("op_2557_cast_fp16")]; tensor denom_67_epsilon_0 = const()[name = tensor("denom_67_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_67_cast_fp16 = rsqrt(epsilon = denom_67_epsilon_0, x = var_2557_cast_fp16)[name = tensor("denom_67_cast_fp16")]; tensor out_67_cast_fp16 = mul(x = zero_mean_67_cast_fp16, y = denom_67_cast_fp16)[name = tensor("out_67_cast_fp16")]; tensor obj_133_gamma_0_to_fp16 = const()[name = tensor("obj_133_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355056384)))]; tensor obj_133_beta_0_to_fp16 = const()[name = tensor("obj_133_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355059008)))]; tensor obj_133_epsilon_0_to_fp16 = const()[name = tensor("obj_133_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_133_cast_fp16 = batch_norm(beta = obj_133_beta_0_to_fp16, epsilon = obj_133_epsilon_0_to_fp16, gamma = obj_133_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_67_cast_fp16)[name = tensor("obj_133_cast_fp16")]; tensor var_2572 = const()[name = tensor("op_2572"), val = tensor([1, 1])]; tensor var_2574 = const()[name = tensor("op_2574"), val = tensor([1, 1])]; tensor query_45_pad_type_0 = const()[name = tensor("query_45_pad_type_0"), val = tensor("custom")]; tensor query_45_pad_0 = const()[name = tensor("query_45_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(355061632))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(356290496))), name = tensor("layers_11_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_11_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_11_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(356290688)))]; tensor query_45_cast_fp16 = conv(bias = layers_11_self_attn_q_proj_bias_to_fp16, dilations = var_2574, groups = var_2537, pad = query_45_pad_0, pad_type = query_45_pad_type_0, strides = var_2572, weight = layers_11_self_attn_q_proj_weight_to_fp16_palettized, x = obj_133_cast_fp16)[name = tensor("query_45_cast_fp16")]; tensor var_2578 = const()[name = tensor("op_2578"), val = tensor([1, 1])]; tensor var_2580 = const()[name = tensor("op_2580"), val = tensor([1, 1])]; tensor current_key_23_pad_type_0 = const()[name = tensor("current_key_23_pad_type_0"), val = tensor("custom")]; tensor current_key_23_pad_0 = const()[name = tensor("current_key_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(356293312))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(357522176))), name = tensor("layers_11_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_23_cast_fp16 = conv(dilations = var_2580, groups = var_2537, pad = current_key_23_pad_0, pad_type = current_key_23_pad_type_0, strides = var_2578, weight = layers_11_self_attn_k_proj_weight_to_fp16_palettized, x = obj_133_cast_fp16)[name = tensor("current_key_23_cast_fp16")]; tensor var_2585 = const()[name = tensor("op_2585"), val = tensor([1, 1])]; tensor var_2587 = const()[name = tensor("op_2587"), val = tensor([1, 1])]; tensor current_value_23_pad_type_0 = const()[name = tensor("current_value_23_pad_type_0"), val = tensor("custom")]; tensor current_value_23_pad_0 = const()[name = tensor("current_value_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(357522368))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(358341632))), name = tensor("layers_11_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_11_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_11_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(358341760)))]; tensor current_value_23_cast_fp16 = conv(bias = layers_11_self_attn_v_proj_bias_to_fp16, dilations = var_2587, groups = var_2537, pad = current_value_23_pad_0, pad_type = current_value_23_pad_type_0, strides = var_2585, weight = layers_11_self_attn_v_proj_weight_to_fp16_palettized, x = obj_133_cast_fp16)[name = tensor("current_value_23_cast_fp16")]; tensor var_2594_cast_fp16 = mul(x = current_key_23_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_2594_cast_fp16")]; tensor var_2596_cast_fp16 = mul(x = var_103_cast_fp16_11, y = var_241_cast_fp16)[name = tensor("op_2596_cast_fp16")]; tensor key_45_cast_fp16 = add(x = var_2594_cast_fp16, y = var_2596_cast_fp16)[name = tensor("key_45_cast_fp16")]; tensor var_2598_cast_fp16 = mul(x = current_value_23_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_2598_cast_fp16")]; tensor var_2600_cast_fp16 = mul(x = var_138_cast_fp16_11, y = var_241_cast_fp16)[name = tensor("op_2600_cast_fp16")]; tensor value_45_cast_fp16 = add(x = var_2598_cast_fp16, y = var_2600_cast_fp16)[name = tensor("value_45_cast_fp16")]; tensor var_2603 = const()[name = tensor("op_2603"), val = tensor([1, 20, 64, -1])]; tensor var_2604_cast_fp16 = reshape(shape = var_2603, x = query_45_cast_fp16)[name = tensor("op_2604_cast_fp16")]; tensor var_2605_to_fp16 = const()[name = tensor("op_2605_to_fp16"), val = tensor(0x1p-3)]; tensor var_2606_cast_fp16 = mul(x = var_2604_cast_fp16, y = var_2605_to_fp16)[name = tensor("op_2606_cast_fp16")]; tensor var_2607 = const()[name = tensor("op_2607"), val = tensor([1, 20, 64, -1])]; tensor var_2608_cast_fp16 = reshape(shape = var_2607, x = key_45_cast_fp16)[name = tensor("op_2608_cast_fp16")]; tensor mh_w_67_transpose_x_0 = const()[name = tensor("mh_w_67_transpose_x_0"), val = tensor(true)]; tensor mh_w_67_transpose_y_0 = const()[name = tensor("mh_w_67_transpose_y_0"), val = tensor(false)]; tensor mh_w_67_cast_fp16 = matmul(transpose_x = mh_w_67_transpose_x_0, transpose_y = mh_w_67_transpose_y_0, x = var_2606_cast_fp16, y = var_2608_cast_fp16)[name = tensor("mh_w_67_cast_fp16")]; tensor mh_w_69_cast_fp16 = add(x = mh_w_67_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_69_cast_fp16")]; tensor var_2616_cast_fp16 = softmax(axis = var_2530, x = mh_w_69_cast_fp16)[name = tensor("op_2616_cast_fp16")]; tensor var_2617 = const()[name = tensor("op_2617"), val = tensor([1, 20, 64, -1])]; tensor var_2618_cast_fp16 = reshape(shape = var_2617, x = value_45_cast_fp16)[name = tensor("op_2618_cast_fp16")]; tensor attn_45_transpose_x_0 = const()[name = tensor("attn_45_transpose_x_0"), val = tensor(false)]; tensor attn_45_transpose_y_0 = const()[name = tensor("attn_45_transpose_y_0"), val = tensor(true)]; tensor attn_45_cast_fp16 = matmul(transpose_x = attn_45_transpose_x_0, transpose_y = attn_45_transpose_y_0, x = var_2618_cast_fp16, y = var_2616_cast_fp16)[name = tensor("attn_45_cast_fp16")]; tensor var_2621 = const()[name = tensor("op_2621"), val = tensor([1, 1280, 1, -1])]; tensor input_111_cast_fp16 = reshape(shape = var_2621, x = attn_45_cast_fp16)[name = tensor("input_111_cast_fp16")]; tensor var_2625 = const()[name = tensor("op_2625"), val = tensor([1, 1])]; tensor var_2627 = const()[name = tensor("op_2627"), val = tensor([1, 1])]; tensor obj_139_pad_type_0 = const()[name = tensor("obj_139_pad_type_0"), val = tensor("custom")]; tensor obj_139_pad_0 = const()[name = tensor("obj_139_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(358344384))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(359573248))), name = tensor("layers_11_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_11_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_11_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(359573440)))]; tensor obj_139_cast_fp16 = conv(bias = layers_11_self_attn_o_proj_bias_to_fp16, dilations = var_2627, groups = var_2537, pad = obj_139_pad_0, pad_type = obj_139_pad_type_0, strides = var_2625, weight = layers_11_self_attn_o_proj_weight_to_fp16_palettized, x = input_111_cast_fp16)[name = tensor("obj_139_cast_fp16")]; tensor inputs_69_cast_fp16 = add(x = inputs_67_cast_fp16, y = obj_139_cast_fp16)[name = tensor("inputs_69_cast_fp16")]; tensor var_2637 = const()[name = tensor("op_2637"), val = tensor([1])]; tensor channels_mean_69_cast_fp16 = reduce_mean(axes = var_2637, keep_dims = var_2538, x = inputs_69_cast_fp16)[name = tensor("channels_mean_69_cast_fp16")]; tensor zero_mean_69_cast_fp16 = sub(x = inputs_69_cast_fp16, y = channels_mean_69_cast_fp16)[name = tensor("zero_mean_69_cast_fp16")]; tensor zero_mean_sq_69_cast_fp16 = mul(x = zero_mean_69_cast_fp16, y = zero_mean_69_cast_fp16)[name = tensor("zero_mean_sq_69_cast_fp16")]; tensor var_2641 = const()[name = tensor("op_2641"), val = tensor([1])]; tensor var_2642_cast_fp16 = reduce_mean(axes = var_2641, keep_dims = var_2538, x = zero_mean_sq_69_cast_fp16)[name = tensor("op_2642_cast_fp16")]; tensor var_2643_to_fp16 = const()[name = tensor("op_2643_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2644_cast_fp16 = add(x = var_2642_cast_fp16, y = var_2643_to_fp16)[name = tensor("op_2644_cast_fp16")]; tensor denom_69_epsilon_0 = const()[name = tensor("denom_69_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_69_cast_fp16 = rsqrt(epsilon = denom_69_epsilon_0, x = var_2644_cast_fp16)[name = tensor("denom_69_cast_fp16")]; tensor out_69_cast_fp16 = mul(x = zero_mean_69_cast_fp16, y = denom_69_cast_fp16)[name = tensor("out_69_cast_fp16")]; tensor obj_141_gamma_0_to_fp16 = const()[name = tensor("obj_141_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(359576064)))]; tensor obj_141_beta_0_to_fp16 = const()[name = tensor("obj_141_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(359578688)))]; tensor obj_141_epsilon_0_to_fp16 = const()[name = tensor("obj_141_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_141_cast_fp16 = batch_norm(beta = obj_141_beta_0_to_fp16, epsilon = obj_141_epsilon_0_to_fp16, gamma = obj_141_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_69_cast_fp16)[name = tensor("obj_141_cast_fp16")]; tensor var_2659 = const()[name = tensor("op_2659"), val = tensor([1, 1])]; tensor var_2661 = const()[name = tensor("op_2661"), val = tensor([1, 1])]; tensor query_47_pad_type_0 = const()[name = tensor("query_47_pad_type_0"), val = tensor("custom")]; tensor query_47_pad_0 = const()[name = tensor("query_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(359581312))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(360400576))), name = tensor("layers_11_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_11_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_11_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(360400704)))]; tensor query_47_cast_fp16 = conv(bias = layers_11_encoder_attn_q_proj_bias_to_fp16, dilations = var_2661, groups = var_2537, pad = query_47_pad_0, pad_type = query_47_pad_type_0, strides = var_2659, weight = layers_11_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_141_cast_fp16)[name = tensor("query_47_cast_fp16")]; tensor var_2665 = const()[name = tensor("op_2665"), val = tensor([1, 1])]; tensor var_2667 = const()[name = tensor("op_2667"), val = tensor([1, 1])]; tensor key_47_pad_type_0 = const()[name = tensor("key_47_pad_type_0"), val = tensor("custom")]; tensor key_47_pad_0 = const()[name = tensor("key_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(360403328))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361222592))), name = tensor("layers_11_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_47_cast_fp16 = conv(dilations = var_2667, groups = var_2537, pad = key_47_pad_0, pad_type = key_47_pad_type_0, strides = var_2665, weight = layers_11_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_47_cast_fp16")]; tensor var_2672 = const()[name = tensor("op_2672"), val = tensor([1, 1])]; tensor var_2674 = const()[name = tensor("op_2674"), val = tensor([1, 1])]; tensor value_47_pad_type_0 = const()[name = tensor("value_47_pad_type_0"), val = tensor("custom")]; tensor value_47_pad_0 = const()[name = tensor("value_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(361222720))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362041984))), name = tensor("layers_11_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_11_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_11_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362042112)))]; tensor value_47_cast_fp16 = conv(bias = layers_11_encoder_attn_v_proj_bias_to_fp16, dilations = var_2674, groups = var_2537, pad = value_47_pad_0, pad_type = value_47_pad_type_0, strides = var_2672, weight = layers_11_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_47_cast_fp16")]; tensor var_2678 = const()[name = tensor("op_2678"), val = tensor([1, 20, 64, -1])]; tensor var_2679_cast_fp16 = reshape(shape = var_2678, x = query_47_cast_fp16)[name = tensor("op_2679_cast_fp16")]; tensor var_2680_to_fp16 = const()[name = tensor("op_2680_to_fp16"), val = tensor(0x1p-3)]; tensor var_2681_cast_fp16 = mul(x = var_2679_cast_fp16, y = var_2680_to_fp16)[name = tensor("op_2681_cast_fp16")]; tensor var_2682 = const()[name = tensor("op_2682"), val = tensor([1, 20, 64, -1])]; tensor var_2683_cast_fp16 = reshape(shape = var_2682, x = key_47_cast_fp16)[name = tensor("op_2683_cast_fp16")]; tensor mh_w_71_transpose_x_0 = const()[name = tensor("mh_w_71_transpose_x_0"), val = tensor(true)]; tensor mh_w_71_transpose_y_0 = const()[name = tensor("mh_w_71_transpose_y_0"), val = tensor(false)]; tensor mh_w_71_cast_fp16 = matmul(transpose_x = mh_w_71_transpose_x_0, transpose_y = mh_w_71_transpose_y_0, x = var_2681_cast_fp16, y = var_2683_cast_fp16)[name = tensor("mh_w_71_cast_fp16")]; tensor var_2686_cast_fp16 = softmax(axis = var_2530, x = mh_w_71_cast_fp16)[name = tensor("op_2686_cast_fp16")]; tensor var_2687 = const()[name = tensor("op_2687"), val = tensor([1, 20, 64, -1])]; tensor var_2688_cast_fp16 = reshape(shape = var_2687, x = value_47_cast_fp16)[name = tensor("op_2688_cast_fp16")]; tensor attn_47_transpose_x_0 = const()[name = tensor("attn_47_transpose_x_0"), val = tensor(false)]; tensor attn_47_transpose_y_0 = const()[name = tensor("attn_47_transpose_y_0"), val = tensor(true)]; tensor attn_47_cast_fp16 = matmul(transpose_x = attn_47_transpose_x_0, transpose_y = attn_47_transpose_y_0, x = var_2688_cast_fp16, y = var_2686_cast_fp16)[name = tensor("attn_47_cast_fp16")]; tensor var_2691 = const()[name = tensor("op_2691"), val = tensor([1, 1280, 1, -1])]; tensor input_113_cast_fp16 = reshape(shape = var_2691, x = attn_47_cast_fp16)[name = tensor("input_113_cast_fp16")]; tensor var_2695 = const()[name = tensor("op_2695"), val = tensor([1, 1])]; tensor var_2697 = const()[name = tensor("op_2697"), val = tensor([1, 1])]; tensor obj_143_pad_type_0 = const()[name = tensor("obj_143_pad_type_0"), val = tensor("custom")]; tensor obj_143_pad_0 = const()[name = tensor("obj_143_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362044736))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362864000))), name = tensor("layers_11_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_11_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_11_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362864128)))]; tensor obj_143_cast_fp16 = conv(bias = layers_11_encoder_attn_o_proj_bias_to_fp16, dilations = var_2697, groups = var_2537, pad = obj_143_pad_0, pad_type = obj_143_pad_type_0, strides = var_2695, weight = layers_11_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_113_cast_fp16)[name = tensor("obj_143_cast_fp16")]; tensor inputs_71_cast_fp16 = add(x = inputs_69_cast_fp16, y = obj_143_cast_fp16)[name = tensor("inputs_71_cast_fp16")]; tensor var_2703 = const()[name = tensor("op_2703"), val = tensor([1])]; tensor channels_mean_71_cast_fp16 = reduce_mean(axes = var_2703, keep_dims = var_2538, x = inputs_71_cast_fp16)[name = tensor("channels_mean_71_cast_fp16")]; tensor zero_mean_71_cast_fp16 = sub(x = inputs_71_cast_fp16, y = channels_mean_71_cast_fp16)[name = tensor("zero_mean_71_cast_fp16")]; tensor zero_mean_sq_71_cast_fp16 = mul(x = zero_mean_71_cast_fp16, y = zero_mean_71_cast_fp16)[name = tensor("zero_mean_sq_71_cast_fp16")]; tensor var_2707 = const()[name = tensor("op_2707"), val = tensor([1])]; tensor var_2708_cast_fp16 = reduce_mean(axes = var_2707, keep_dims = var_2538, x = zero_mean_sq_71_cast_fp16)[name = tensor("op_2708_cast_fp16")]; tensor var_2709_to_fp16 = const()[name = tensor("op_2709_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2710_cast_fp16 = add(x = var_2708_cast_fp16, y = var_2709_to_fp16)[name = tensor("op_2710_cast_fp16")]; tensor denom_71_epsilon_0 = const()[name = tensor("denom_71_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_71_cast_fp16 = rsqrt(epsilon = denom_71_epsilon_0, x = var_2710_cast_fp16)[name = tensor("denom_71_cast_fp16")]; tensor out_71_cast_fp16 = mul(x = zero_mean_71_cast_fp16, y = denom_71_cast_fp16)[name = tensor("out_71_cast_fp16")]; tensor input_115_gamma_0_to_fp16 = const()[name = tensor("input_115_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362866752)))]; tensor input_115_beta_0_to_fp16 = const()[name = tensor("input_115_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362869376)))]; tensor input_115_epsilon_0_to_fp16 = const()[name = tensor("input_115_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_115_cast_fp16 = batch_norm(beta = input_115_beta_0_to_fp16, epsilon = input_115_epsilon_0_to_fp16, gamma = input_115_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_71_cast_fp16)[name = tensor("input_115_cast_fp16")]; tensor var_2721 = const()[name = tensor("op_2721"), val = tensor([1, 1])]; tensor var_2723 = const()[name = tensor("op_2723"), val = tensor([1, 1])]; tensor input_117_pad_type_0 = const()[name = tensor("input_117_pad_type_0"), val = tensor("custom")]; tensor input_117_pad_0 = const()[name = tensor("input_117_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362872000))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369425664))), name = tensor("layers_11_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_11_fc1_bias_to_fp16 = const()[name = tensor("layers_11_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369426240)))]; tensor input_117_cast_fp16 = conv(bias = layers_11_fc1_bias_to_fp16, dilations = var_2723, groups = var_2537, pad = input_117_pad_0, pad_type = input_117_pad_type_0, strides = var_2721, weight = layers_11_fc1_weight_to_fp16_palettized, x = input_115_cast_fp16)[name = tensor("input_117_cast_fp16")]; tensor input_119_mode_0 = const()[name = tensor("input_119_mode_0"), val = tensor("EXACT")]; tensor input_119_cast_fp16 = gelu(mode = input_119_mode_0, x = input_117_cast_fp16)[name = tensor("input_119_cast_fp16")]; tensor var_2729 = const()[name = tensor("op_2729"), val = tensor([1, 1])]; tensor var_2731 = const()[name = tensor("op_2731"), val = tensor([1, 1])]; tensor hidden_states_25_pad_type_0 = const()[name = tensor("hidden_states_25_pad_type_0"), val = tensor("custom")]; tensor hidden_states_25_pad_0 = const()[name = tensor("hidden_states_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_11_fc2_weight_to_fp16 = const()[name = tensor("layers_11_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(369436544)))]; tensor layers_11_fc2_bias_to_fp16 = const()[name = tensor("layers_11_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382543808)))]; tensor hidden_states_25_cast_fp16 = conv(bias = layers_11_fc2_bias_to_fp16, dilations = var_2731, groups = var_2537, pad = hidden_states_25_pad_0, pad_type = hidden_states_25_pad_type_0, strides = var_2729, weight = layers_11_fc2_weight_to_fp16, x = input_119_cast_fp16)[name = tensor("hidden_states_25_cast_fp16")]; tensor inputs_73_cast_fp16 = add(x = inputs_71_cast_fp16, y = hidden_states_25_cast_fp16)[name = tensor("inputs_73_cast_fp16")]; tensor var_2744 = const()[name = tensor("op_2744"), val = tensor(3)]; tensor var_2751 = const()[name = tensor("op_2751"), val = tensor(1)]; tensor var_2752 = const()[name = tensor("op_2752"), val = tensor(true)]; tensor var_2764 = const()[name = tensor("op_2764"), val = tensor([1])]; tensor channels_mean_73_cast_fp16 = reduce_mean(axes = var_2764, keep_dims = var_2752, x = inputs_73_cast_fp16)[name = tensor("channels_mean_73_cast_fp16")]; tensor zero_mean_73_cast_fp16 = sub(x = inputs_73_cast_fp16, y = channels_mean_73_cast_fp16)[name = tensor("zero_mean_73_cast_fp16")]; tensor zero_mean_sq_73_cast_fp16 = mul(x = zero_mean_73_cast_fp16, y = zero_mean_73_cast_fp16)[name = tensor("zero_mean_sq_73_cast_fp16")]; tensor var_2768 = const()[name = tensor("op_2768"), val = tensor([1])]; tensor var_2769_cast_fp16 = reduce_mean(axes = var_2768, keep_dims = var_2752, x = zero_mean_sq_73_cast_fp16)[name = tensor("op_2769_cast_fp16")]; tensor var_2770_to_fp16 = const()[name = tensor("op_2770_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2771_cast_fp16 = add(x = var_2769_cast_fp16, y = var_2770_to_fp16)[name = tensor("op_2771_cast_fp16")]; tensor denom_73_epsilon_0 = const()[name = tensor("denom_73_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_73_cast_fp16 = rsqrt(epsilon = denom_73_epsilon_0, x = var_2771_cast_fp16)[name = tensor("denom_73_cast_fp16")]; tensor out_73_cast_fp16 = mul(x = zero_mean_73_cast_fp16, y = denom_73_cast_fp16)[name = tensor("out_73_cast_fp16")]; tensor obj_145_gamma_0_to_fp16 = const()[name = tensor("obj_145_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382546432)))]; tensor obj_145_beta_0_to_fp16 = const()[name = tensor("obj_145_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382549056)))]; tensor obj_145_epsilon_0_to_fp16 = const()[name = tensor("obj_145_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_145_cast_fp16 = batch_norm(beta = obj_145_beta_0_to_fp16, epsilon = obj_145_epsilon_0_to_fp16, gamma = obj_145_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_73_cast_fp16)[name = tensor("obj_145_cast_fp16")]; tensor var_2786 = const()[name = tensor("op_2786"), val = tensor([1, 1])]; tensor var_2788 = const()[name = tensor("op_2788"), val = tensor([1, 1])]; tensor query_49_pad_type_0 = const()[name = tensor("query_49_pad_type_0"), val = tensor("custom")]; tensor query_49_pad_0 = const()[name = tensor("query_49_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(382551680))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383780544))), name = tensor("layers_12_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_12_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_12_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383780736)))]; tensor query_49_cast_fp16 = conv(bias = layers_12_self_attn_q_proj_bias_to_fp16, dilations = var_2788, groups = var_2751, pad = query_49_pad_0, pad_type = query_49_pad_type_0, strides = var_2786, weight = layers_12_self_attn_q_proj_weight_to_fp16_palettized, x = obj_145_cast_fp16)[name = tensor("query_49_cast_fp16")]; tensor var_2792 = const()[name = tensor("op_2792"), val = tensor([1, 1])]; tensor var_2794 = const()[name = tensor("op_2794"), val = tensor([1, 1])]; tensor current_key_25_pad_type_0 = const()[name = tensor("current_key_25_pad_type_0"), val = tensor("custom")]; tensor current_key_25_pad_0 = const()[name = tensor("current_key_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383783360))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(384602624))), name = tensor("layers_12_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_25_cast_fp16 = conv(dilations = var_2794, groups = var_2751, pad = current_key_25_pad_0, pad_type = current_key_25_pad_type_0, strides = var_2792, weight = layers_12_self_attn_k_proj_weight_to_fp16_palettized, x = obj_145_cast_fp16)[name = tensor("current_key_25_cast_fp16")]; tensor var_2799 = const()[name = tensor("op_2799"), val = tensor([1, 1])]; tensor var_2801 = const()[name = tensor("op_2801"), val = tensor([1, 1])]; tensor current_value_25_pad_type_0 = const()[name = tensor("current_value_25_pad_type_0"), val = tensor("custom")]; tensor current_value_25_pad_0 = const()[name = tensor("current_value_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(384602752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(385422016))), name = tensor("layers_12_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_12_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_12_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(385422144)))]; tensor current_value_25_cast_fp16 = conv(bias = layers_12_self_attn_v_proj_bias_to_fp16, dilations = var_2801, groups = var_2751, pad = current_value_25_pad_0, pad_type = current_value_25_pad_type_0, strides = var_2799, weight = layers_12_self_attn_v_proj_weight_to_fp16_palettized, x = obj_145_cast_fp16)[name = tensor("current_value_25_cast_fp16")]; tensor var_2808_cast_fp16 = mul(x = current_key_25_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_2808_cast_fp16")]; tensor var_2810_cast_fp16 = mul(x = var_103_cast_fp16_12, y = var_241_cast_fp16)[name = tensor("op_2810_cast_fp16")]; tensor key_49_cast_fp16 = add(x = var_2808_cast_fp16, y = var_2810_cast_fp16)[name = tensor("key_49_cast_fp16")]; tensor var_2812_cast_fp16 = mul(x = current_value_25_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_2812_cast_fp16")]; tensor var_2814_cast_fp16 = mul(x = var_138_cast_fp16_12, y = var_241_cast_fp16)[name = tensor("op_2814_cast_fp16")]; tensor value_49_cast_fp16 = add(x = var_2812_cast_fp16, y = var_2814_cast_fp16)[name = tensor("value_49_cast_fp16")]; tensor var_2817 = const()[name = tensor("op_2817"), val = tensor([1, 20, 64, -1])]; tensor var_2818_cast_fp16 = reshape(shape = var_2817, x = query_49_cast_fp16)[name = tensor("op_2818_cast_fp16")]; tensor var_2819_to_fp16 = const()[name = tensor("op_2819_to_fp16"), val = tensor(0x1p-3)]; tensor var_2820_cast_fp16 = mul(x = var_2818_cast_fp16, y = var_2819_to_fp16)[name = tensor("op_2820_cast_fp16")]; tensor var_2821 = const()[name = tensor("op_2821"), val = tensor([1, 20, 64, -1])]; tensor var_2822_cast_fp16 = reshape(shape = var_2821, x = key_49_cast_fp16)[name = tensor("op_2822_cast_fp16")]; tensor mh_w_73_transpose_x_0 = const()[name = tensor("mh_w_73_transpose_x_0"), val = tensor(true)]; tensor mh_w_73_transpose_y_0 = const()[name = tensor("mh_w_73_transpose_y_0"), val = tensor(false)]; tensor mh_w_73_cast_fp16 = matmul(transpose_x = mh_w_73_transpose_x_0, transpose_y = mh_w_73_transpose_y_0, x = var_2820_cast_fp16, y = var_2822_cast_fp16)[name = tensor("mh_w_73_cast_fp16")]; tensor mh_w_75_cast_fp16 = add(x = mh_w_73_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_75_cast_fp16")]; tensor var_2830_cast_fp16 = softmax(axis = var_2744, x = mh_w_75_cast_fp16)[name = tensor("op_2830_cast_fp16")]; tensor var_2831 = const()[name = tensor("op_2831"), val = tensor([1, 20, 64, -1])]; tensor var_2832_cast_fp16 = reshape(shape = var_2831, x = value_49_cast_fp16)[name = tensor("op_2832_cast_fp16")]; tensor attn_49_transpose_x_0 = const()[name = tensor("attn_49_transpose_x_0"), val = tensor(false)]; tensor attn_49_transpose_y_0 = const()[name = tensor("attn_49_transpose_y_0"), val = tensor(true)]; tensor attn_49_cast_fp16 = matmul(transpose_x = attn_49_transpose_x_0, transpose_y = attn_49_transpose_y_0, x = var_2832_cast_fp16, y = var_2830_cast_fp16)[name = tensor("attn_49_cast_fp16")]; tensor var_2835 = const()[name = tensor("op_2835"), val = tensor([1, 1280, 1, -1])]; tensor input_121_cast_fp16 = reshape(shape = var_2835, x = attn_49_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor var_2839 = const()[name = tensor("op_2839"), val = tensor([1, 1])]; tensor var_2841 = const()[name = tensor("op_2841"), val = tensor([1, 1])]; tensor obj_151_pad_type_0 = const()[name = tensor("obj_151_pad_type_0"), val = tensor("custom")]; tensor obj_151_pad_0 = const()[name = tensor("obj_151_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(385424768))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386653632))), name = tensor("layers_12_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_12_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_12_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386653824)))]; tensor obj_151_cast_fp16 = conv(bias = layers_12_self_attn_o_proj_bias_to_fp16, dilations = var_2841, groups = var_2751, pad = obj_151_pad_0, pad_type = obj_151_pad_type_0, strides = var_2839, weight = layers_12_self_attn_o_proj_weight_to_fp16_palettized, x = input_121_cast_fp16)[name = tensor("obj_151_cast_fp16")]; tensor inputs_75_cast_fp16 = add(x = inputs_73_cast_fp16, y = obj_151_cast_fp16)[name = tensor("inputs_75_cast_fp16")]; tensor var_2851 = const()[name = tensor("op_2851"), val = tensor([1])]; tensor channels_mean_75_cast_fp16 = reduce_mean(axes = var_2851, keep_dims = var_2752, x = inputs_75_cast_fp16)[name = tensor("channels_mean_75_cast_fp16")]; tensor zero_mean_75_cast_fp16 = sub(x = inputs_75_cast_fp16, y = channels_mean_75_cast_fp16)[name = tensor("zero_mean_75_cast_fp16")]; tensor zero_mean_sq_75_cast_fp16 = mul(x = zero_mean_75_cast_fp16, y = zero_mean_75_cast_fp16)[name = tensor("zero_mean_sq_75_cast_fp16")]; tensor var_2855 = const()[name = tensor("op_2855"), val = tensor([1])]; tensor var_2856_cast_fp16 = reduce_mean(axes = var_2855, keep_dims = var_2752, x = zero_mean_sq_75_cast_fp16)[name = tensor("op_2856_cast_fp16")]; tensor var_2857_to_fp16 = const()[name = tensor("op_2857_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2858_cast_fp16 = add(x = var_2856_cast_fp16, y = var_2857_to_fp16)[name = tensor("op_2858_cast_fp16")]; tensor denom_75_epsilon_0 = const()[name = tensor("denom_75_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_75_cast_fp16 = rsqrt(epsilon = denom_75_epsilon_0, x = var_2858_cast_fp16)[name = tensor("denom_75_cast_fp16")]; tensor out_75_cast_fp16 = mul(x = zero_mean_75_cast_fp16, y = denom_75_cast_fp16)[name = tensor("out_75_cast_fp16")]; tensor obj_153_gamma_0_to_fp16 = const()[name = tensor("obj_153_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386656448)))]; tensor obj_153_beta_0_to_fp16 = const()[name = tensor("obj_153_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386659072)))]; tensor obj_153_epsilon_0_to_fp16 = const()[name = tensor("obj_153_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_153_cast_fp16 = batch_norm(beta = obj_153_beta_0_to_fp16, epsilon = obj_153_epsilon_0_to_fp16, gamma = obj_153_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_75_cast_fp16)[name = tensor("obj_153_cast_fp16")]; tensor var_2873 = const()[name = tensor("op_2873"), val = tensor([1, 1])]; tensor var_2875 = const()[name = tensor("op_2875"), val = tensor([1, 1])]; tensor query_51_pad_type_0 = const()[name = tensor("query_51_pad_type_0"), val = tensor("custom")]; tensor query_51_pad_0 = const()[name = tensor("query_51_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(386661696))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387480960))), name = tensor("layers_12_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_12_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_12_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387481088)))]; tensor query_51_cast_fp16 = conv(bias = layers_12_encoder_attn_q_proj_bias_to_fp16, dilations = var_2875, groups = var_2751, pad = query_51_pad_0, pad_type = query_51_pad_type_0, strides = var_2873, weight = layers_12_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_153_cast_fp16)[name = tensor("query_51_cast_fp16")]; tensor var_2879 = const()[name = tensor("op_2879"), val = tensor([1, 1])]; tensor var_2881 = const()[name = tensor("op_2881"), val = tensor([1, 1])]; tensor key_51_pad_type_0 = const()[name = tensor("key_51_pad_type_0"), val = tensor("custom")]; tensor key_51_pad_0 = const()[name = tensor("key_51_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387483712))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(388302976))), name = tensor("layers_12_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_51_cast_fp16 = conv(dilations = var_2881, groups = var_2751, pad = key_51_pad_0, pad_type = key_51_pad_type_0, strides = var_2879, weight = layers_12_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_51_cast_fp16")]; tensor var_2886 = const()[name = tensor("op_2886"), val = tensor([1, 1])]; tensor var_2888 = const()[name = tensor("op_2888"), val = tensor([1, 1])]; tensor value_51_pad_type_0 = const()[name = tensor("value_51_pad_type_0"), val = tensor("custom")]; tensor value_51_pad_0 = const()[name = tensor("value_51_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(388303104))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(389122368))), name = tensor("layers_12_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_12_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_12_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(389122496)))]; tensor value_51_cast_fp16 = conv(bias = layers_12_encoder_attn_v_proj_bias_to_fp16, dilations = var_2888, groups = var_2751, pad = value_51_pad_0, pad_type = value_51_pad_type_0, strides = var_2886, weight = layers_12_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_51_cast_fp16")]; tensor var_2892 = const()[name = tensor("op_2892"), val = tensor([1, 20, 64, -1])]; tensor var_2893_cast_fp16 = reshape(shape = var_2892, x = query_51_cast_fp16)[name = tensor("op_2893_cast_fp16")]; tensor var_2894_to_fp16 = const()[name = tensor("op_2894_to_fp16"), val = tensor(0x1p-3)]; tensor var_2895_cast_fp16 = mul(x = var_2893_cast_fp16, y = var_2894_to_fp16)[name = tensor("op_2895_cast_fp16")]; tensor var_2896 = const()[name = tensor("op_2896"), val = tensor([1, 20, 64, -1])]; tensor var_2897_cast_fp16 = reshape(shape = var_2896, x = key_51_cast_fp16)[name = tensor("op_2897_cast_fp16")]; tensor mh_w_77_transpose_x_0 = const()[name = tensor("mh_w_77_transpose_x_0"), val = tensor(true)]; tensor mh_w_77_transpose_y_0 = const()[name = tensor("mh_w_77_transpose_y_0"), val = tensor(false)]; tensor mh_w_77_cast_fp16 = matmul(transpose_x = mh_w_77_transpose_x_0, transpose_y = mh_w_77_transpose_y_0, x = var_2895_cast_fp16, y = var_2897_cast_fp16)[name = tensor("mh_w_77_cast_fp16")]; tensor var_2900_cast_fp16 = softmax(axis = var_2744, x = mh_w_77_cast_fp16)[name = tensor("op_2900_cast_fp16")]; tensor var_2901 = const()[name = tensor("op_2901"), val = tensor([1, 20, 64, -1])]; tensor var_2902_cast_fp16 = reshape(shape = var_2901, x = value_51_cast_fp16)[name = tensor("op_2902_cast_fp16")]; tensor attn_51_transpose_x_0 = const()[name = tensor("attn_51_transpose_x_0"), val = tensor(false)]; tensor attn_51_transpose_y_0 = const()[name = tensor("attn_51_transpose_y_0"), val = tensor(true)]; tensor attn_51_cast_fp16 = matmul(transpose_x = attn_51_transpose_x_0, transpose_y = attn_51_transpose_y_0, x = var_2902_cast_fp16, y = var_2900_cast_fp16)[name = tensor("attn_51_cast_fp16")]; tensor var_2905 = const()[name = tensor("op_2905"), val = tensor([1, 1280, 1, -1])]; tensor input_123_cast_fp16 = reshape(shape = var_2905, x = attn_51_cast_fp16)[name = tensor("input_123_cast_fp16")]; tensor var_2909 = const()[name = tensor("op_2909"), val = tensor([1, 1])]; tensor var_2911 = const()[name = tensor("op_2911"), val = tensor([1, 1])]; tensor obj_155_pad_type_0 = const()[name = tensor("obj_155_pad_type_0"), val = tensor("custom")]; tensor obj_155_pad_0 = const()[name = tensor("obj_155_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(389125120))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390353984))), name = tensor("layers_12_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_12_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_12_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390354176)))]; tensor obj_155_cast_fp16 = conv(bias = layers_12_encoder_attn_o_proj_bias_to_fp16, dilations = var_2911, groups = var_2751, pad = obj_155_pad_0, pad_type = obj_155_pad_type_0, strides = var_2909, weight = layers_12_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_123_cast_fp16)[name = tensor("obj_155_cast_fp16")]; tensor inputs_77_cast_fp16 = add(x = inputs_75_cast_fp16, y = obj_155_cast_fp16)[name = tensor("inputs_77_cast_fp16")]; tensor var_2917 = const()[name = tensor("op_2917"), val = tensor([1])]; tensor channels_mean_77_cast_fp16 = reduce_mean(axes = var_2917, keep_dims = var_2752, x = inputs_77_cast_fp16)[name = tensor("channels_mean_77_cast_fp16")]; tensor zero_mean_77_cast_fp16 = sub(x = inputs_77_cast_fp16, y = channels_mean_77_cast_fp16)[name = tensor("zero_mean_77_cast_fp16")]; tensor zero_mean_sq_77_cast_fp16 = mul(x = zero_mean_77_cast_fp16, y = zero_mean_77_cast_fp16)[name = tensor("zero_mean_sq_77_cast_fp16")]; tensor var_2921 = const()[name = tensor("op_2921"), val = tensor([1])]; tensor var_2922_cast_fp16 = reduce_mean(axes = var_2921, keep_dims = var_2752, x = zero_mean_sq_77_cast_fp16)[name = tensor("op_2922_cast_fp16")]; tensor var_2923_to_fp16 = const()[name = tensor("op_2923_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2924_cast_fp16 = add(x = var_2922_cast_fp16, y = var_2923_to_fp16)[name = tensor("op_2924_cast_fp16")]; tensor denom_77_epsilon_0 = const()[name = tensor("denom_77_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_77_cast_fp16 = rsqrt(epsilon = denom_77_epsilon_0, x = var_2924_cast_fp16)[name = tensor("denom_77_cast_fp16")]; tensor out_77_cast_fp16 = mul(x = zero_mean_77_cast_fp16, y = denom_77_cast_fp16)[name = tensor("out_77_cast_fp16")]; tensor input_125_gamma_0_to_fp16 = const()[name = tensor("input_125_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390356800)))]; tensor input_125_beta_0_to_fp16 = const()[name = tensor("input_125_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390359424)))]; tensor input_125_epsilon_0_to_fp16 = const()[name = tensor("input_125_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_125_cast_fp16 = batch_norm(beta = input_125_beta_0_to_fp16, epsilon = input_125_epsilon_0_to_fp16, gamma = input_125_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_77_cast_fp16)[name = tensor("input_125_cast_fp16")]; tensor var_2935 = const()[name = tensor("op_2935"), val = tensor([1, 1])]; tensor var_2937 = const()[name = tensor("op_2937"), val = tensor([1, 1])]; tensor input_127_pad_type_0 = const()[name = tensor("input_127_pad_type_0"), val = tensor("custom")]; tensor input_127_pad_0 = const()[name = tensor("input_127_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(390362048))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396915712))), name = tensor("layers_12_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_12_fc1_bias_to_fp16 = const()[name = tensor("layers_12_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396916288)))]; tensor input_127_cast_fp16 = conv(bias = layers_12_fc1_bias_to_fp16, dilations = var_2937, groups = var_2751, pad = input_127_pad_0, pad_type = input_127_pad_type_0, strides = var_2935, weight = layers_12_fc1_weight_to_fp16_palettized, x = input_125_cast_fp16)[name = tensor("input_127_cast_fp16")]; tensor input_129_mode_0 = const()[name = tensor("input_129_mode_0"), val = tensor("EXACT")]; tensor input_129_cast_fp16 = gelu(mode = input_129_mode_0, x = input_127_cast_fp16)[name = tensor("input_129_cast_fp16")]; tensor var_2943 = const()[name = tensor("op_2943"), val = tensor([1, 1])]; tensor var_2945 = const()[name = tensor("op_2945"), val = tensor([1, 1])]; tensor hidden_states_27_pad_type_0 = const()[name = tensor("hidden_states_27_pad_type_0"), val = tensor("custom")]; tensor hidden_states_27_pad_0 = const()[name = tensor("hidden_states_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_12_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396926592))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(401841856))), name = tensor("layers_12_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_12_fc2_bias_to_fp16 = const()[name = tensor("layers_12_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(401842048)))]; tensor hidden_states_27_cast_fp16 = conv(bias = layers_12_fc2_bias_to_fp16, dilations = var_2945, groups = var_2751, pad = hidden_states_27_pad_0, pad_type = hidden_states_27_pad_type_0, strides = var_2943, weight = layers_12_fc2_weight_to_fp16_palettized, x = input_129_cast_fp16)[name = tensor("hidden_states_27_cast_fp16")]; tensor inputs_79_cast_fp16 = add(x = inputs_77_cast_fp16, y = hidden_states_27_cast_fp16)[name = tensor("inputs_79_cast_fp16")]; tensor var_2958 = const()[name = tensor("op_2958"), val = tensor(3)]; tensor var_2965 = const()[name = tensor("op_2965"), val = tensor(1)]; tensor var_2966 = const()[name = tensor("op_2966"), val = tensor(true)]; tensor var_2978 = const()[name = tensor("op_2978"), val = tensor([1])]; tensor channels_mean_79_cast_fp16 = reduce_mean(axes = var_2978, keep_dims = var_2966, x = inputs_79_cast_fp16)[name = tensor("channels_mean_79_cast_fp16")]; tensor zero_mean_79_cast_fp16 = sub(x = inputs_79_cast_fp16, y = channels_mean_79_cast_fp16)[name = tensor("zero_mean_79_cast_fp16")]; tensor zero_mean_sq_79_cast_fp16 = mul(x = zero_mean_79_cast_fp16, y = zero_mean_79_cast_fp16)[name = tensor("zero_mean_sq_79_cast_fp16")]; tensor var_2982 = const()[name = tensor("op_2982"), val = tensor([1])]; tensor var_2983_cast_fp16 = reduce_mean(axes = var_2982, keep_dims = var_2966, x = zero_mean_sq_79_cast_fp16)[name = tensor("op_2983_cast_fp16")]; tensor var_2984_to_fp16 = const()[name = tensor("op_2984_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2985_cast_fp16 = add(x = var_2983_cast_fp16, y = var_2984_to_fp16)[name = tensor("op_2985_cast_fp16")]; tensor denom_79_epsilon_0 = const()[name = tensor("denom_79_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_79_cast_fp16 = rsqrt(epsilon = denom_79_epsilon_0, x = var_2985_cast_fp16)[name = tensor("denom_79_cast_fp16")]; tensor out_79_cast_fp16 = mul(x = zero_mean_79_cast_fp16, y = denom_79_cast_fp16)[name = tensor("out_79_cast_fp16")]; tensor obj_157_gamma_0_to_fp16 = const()[name = tensor("obj_157_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(401844672)))]; tensor obj_157_beta_0_to_fp16 = const()[name = tensor("obj_157_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(401847296)))]; tensor obj_157_epsilon_0_to_fp16 = const()[name = tensor("obj_157_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_157_cast_fp16 = batch_norm(beta = obj_157_beta_0_to_fp16, epsilon = obj_157_epsilon_0_to_fp16, gamma = obj_157_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_79_cast_fp16)[name = tensor("obj_157_cast_fp16")]; tensor var_3000 = const()[name = tensor("op_3000"), val = tensor([1, 1])]; tensor var_3002 = const()[name = tensor("op_3002"), val = tensor([1, 1])]; tensor query_53_pad_type_0 = const()[name = tensor("query_53_pad_type_0"), val = tensor("custom")]; tensor query_53_pad_0 = const()[name = tensor("query_53_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(401849920))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(403078784))), name = tensor("layers_13_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_13_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_13_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(403078976)))]; tensor query_53_cast_fp16 = conv(bias = layers_13_self_attn_q_proj_bias_to_fp16, dilations = var_3002, groups = var_2965, pad = query_53_pad_0, pad_type = query_53_pad_type_0, strides = var_3000, weight = layers_13_self_attn_q_proj_weight_to_fp16_palettized, x = obj_157_cast_fp16)[name = tensor("query_53_cast_fp16")]; tensor var_3006 = const()[name = tensor("op_3006"), val = tensor([1, 1])]; tensor var_3008 = const()[name = tensor("op_3008"), val = tensor([1, 1])]; tensor current_key_27_pad_type_0 = const()[name = tensor("current_key_27_pad_type_0"), val = tensor("custom")]; tensor current_key_27_pad_0 = const()[name = tensor("current_key_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(403081600))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(404310464))), name = tensor("layers_13_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_27_cast_fp16 = conv(dilations = var_3008, groups = var_2965, pad = current_key_27_pad_0, pad_type = current_key_27_pad_type_0, strides = var_3006, weight = layers_13_self_attn_k_proj_weight_to_fp16_palettized, x = obj_157_cast_fp16)[name = tensor("current_key_27_cast_fp16")]; tensor var_3013 = const()[name = tensor("op_3013"), val = tensor([1, 1])]; tensor var_3015 = const()[name = tensor("op_3015"), val = tensor([1, 1])]; tensor current_value_27_pad_type_0 = const()[name = tensor("current_value_27_pad_type_0"), val = tensor("custom")]; tensor current_value_27_pad_0 = const()[name = tensor("current_value_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(404310656))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(405129920))), name = tensor("layers_13_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_13_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_13_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(405130048)))]; tensor current_value_27_cast_fp16 = conv(bias = layers_13_self_attn_v_proj_bias_to_fp16, dilations = var_3015, groups = var_2965, pad = current_value_27_pad_0, pad_type = current_value_27_pad_type_0, strides = var_3013, weight = layers_13_self_attn_v_proj_weight_to_fp16_palettized, x = obj_157_cast_fp16)[name = tensor("current_value_27_cast_fp16")]; tensor var_3022_cast_fp16 = mul(x = current_key_27_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3022_cast_fp16")]; tensor var_3024_cast_fp16 = mul(x = var_103_cast_fp16_13, y = var_241_cast_fp16)[name = tensor("op_3024_cast_fp16")]; tensor key_53_cast_fp16 = add(x = var_3022_cast_fp16, y = var_3024_cast_fp16)[name = tensor("key_53_cast_fp16")]; tensor var_3026_cast_fp16 = mul(x = current_value_27_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3026_cast_fp16")]; tensor var_3028_cast_fp16 = mul(x = var_138_cast_fp16_13, y = var_241_cast_fp16)[name = tensor("op_3028_cast_fp16")]; tensor value_53_cast_fp16 = add(x = var_3026_cast_fp16, y = var_3028_cast_fp16)[name = tensor("value_53_cast_fp16")]; tensor var_3031 = const()[name = tensor("op_3031"), val = tensor([1, 20, 64, -1])]; tensor var_3032_cast_fp16 = reshape(shape = var_3031, x = query_53_cast_fp16)[name = tensor("op_3032_cast_fp16")]; tensor var_3033_to_fp16 = const()[name = tensor("op_3033_to_fp16"), val = tensor(0x1p-3)]; tensor var_3034_cast_fp16 = mul(x = var_3032_cast_fp16, y = var_3033_to_fp16)[name = tensor("op_3034_cast_fp16")]; tensor var_3035 = const()[name = tensor("op_3035"), val = tensor([1, 20, 64, -1])]; tensor var_3036_cast_fp16 = reshape(shape = var_3035, x = key_53_cast_fp16)[name = tensor("op_3036_cast_fp16")]; tensor mh_w_79_transpose_x_0 = const()[name = tensor("mh_w_79_transpose_x_0"), val = tensor(true)]; tensor mh_w_79_transpose_y_0 = const()[name = tensor("mh_w_79_transpose_y_0"), val = tensor(false)]; tensor mh_w_79_cast_fp16 = matmul(transpose_x = mh_w_79_transpose_x_0, transpose_y = mh_w_79_transpose_y_0, x = var_3034_cast_fp16, y = var_3036_cast_fp16)[name = tensor("mh_w_79_cast_fp16")]; tensor mh_w_81_cast_fp16 = add(x = mh_w_79_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_81_cast_fp16")]; tensor var_3044_cast_fp16 = softmax(axis = var_2958, x = mh_w_81_cast_fp16)[name = tensor("op_3044_cast_fp16")]; tensor var_3045 = const()[name = tensor("op_3045"), val = tensor([1, 20, 64, -1])]; tensor var_3046_cast_fp16 = reshape(shape = var_3045, x = value_53_cast_fp16)[name = tensor("op_3046_cast_fp16")]; tensor attn_53_transpose_x_0 = const()[name = tensor("attn_53_transpose_x_0"), val = tensor(false)]; tensor attn_53_transpose_y_0 = const()[name = tensor("attn_53_transpose_y_0"), val = tensor(true)]; tensor attn_53_cast_fp16 = matmul(transpose_x = attn_53_transpose_x_0, transpose_y = attn_53_transpose_y_0, x = var_3046_cast_fp16, y = var_3044_cast_fp16)[name = tensor("attn_53_cast_fp16")]; tensor var_3049 = const()[name = tensor("op_3049"), val = tensor([1, 1280, 1, -1])]; tensor input_131_cast_fp16 = reshape(shape = var_3049, x = attn_53_cast_fp16)[name = tensor("input_131_cast_fp16")]; tensor var_3053 = const()[name = tensor("op_3053"), val = tensor([1, 1])]; tensor var_3055 = const()[name = tensor("op_3055"), val = tensor([1, 1])]; tensor obj_163_pad_type_0 = const()[name = tensor("obj_163_pad_type_0"), val = tensor("custom")]; tensor obj_163_pad_0 = const()[name = tensor("obj_163_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(405132672))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406361536))), name = tensor("layers_13_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_13_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_13_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406361728)))]; tensor obj_163_cast_fp16 = conv(bias = layers_13_self_attn_o_proj_bias_to_fp16, dilations = var_3055, groups = var_2965, pad = obj_163_pad_0, pad_type = obj_163_pad_type_0, strides = var_3053, weight = layers_13_self_attn_o_proj_weight_to_fp16_palettized, x = input_131_cast_fp16)[name = tensor("obj_163_cast_fp16")]; tensor inputs_81_cast_fp16 = add(x = inputs_79_cast_fp16, y = obj_163_cast_fp16)[name = tensor("inputs_81_cast_fp16")]; tensor var_3065 = const()[name = tensor("op_3065"), val = tensor([1])]; tensor channels_mean_81_cast_fp16 = reduce_mean(axes = var_3065, keep_dims = var_2966, x = inputs_81_cast_fp16)[name = tensor("channels_mean_81_cast_fp16")]; tensor zero_mean_81_cast_fp16 = sub(x = inputs_81_cast_fp16, y = channels_mean_81_cast_fp16)[name = tensor("zero_mean_81_cast_fp16")]; tensor zero_mean_sq_81_cast_fp16 = mul(x = zero_mean_81_cast_fp16, y = zero_mean_81_cast_fp16)[name = tensor("zero_mean_sq_81_cast_fp16")]; tensor var_3069 = const()[name = tensor("op_3069"), val = tensor([1])]; tensor var_3070_cast_fp16 = reduce_mean(axes = var_3069, keep_dims = var_2966, x = zero_mean_sq_81_cast_fp16)[name = tensor("op_3070_cast_fp16")]; tensor var_3071_to_fp16 = const()[name = tensor("op_3071_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3072_cast_fp16 = add(x = var_3070_cast_fp16, y = var_3071_to_fp16)[name = tensor("op_3072_cast_fp16")]; tensor denom_81_epsilon_0 = const()[name = tensor("denom_81_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_81_cast_fp16 = rsqrt(epsilon = denom_81_epsilon_0, x = var_3072_cast_fp16)[name = tensor("denom_81_cast_fp16")]; tensor out_81_cast_fp16 = mul(x = zero_mean_81_cast_fp16, y = denom_81_cast_fp16)[name = tensor("out_81_cast_fp16")]; tensor obj_165_gamma_0_to_fp16 = const()[name = tensor("obj_165_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406364352)))]; tensor obj_165_beta_0_to_fp16 = const()[name = tensor("obj_165_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406366976)))]; tensor obj_165_epsilon_0_to_fp16 = const()[name = tensor("obj_165_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_165_cast_fp16 = batch_norm(beta = obj_165_beta_0_to_fp16, epsilon = obj_165_epsilon_0_to_fp16, gamma = obj_165_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_81_cast_fp16)[name = tensor("obj_165_cast_fp16")]; tensor var_3087 = const()[name = tensor("op_3087"), val = tensor([1, 1])]; tensor var_3089 = const()[name = tensor("op_3089"), val = tensor([1, 1])]; tensor query_55_pad_type_0 = const()[name = tensor("query_55_pad_type_0"), val = tensor("custom")]; tensor query_55_pad_0 = const()[name = tensor("query_55_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(406369600))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(407188864))), name = tensor("layers_13_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_13_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_13_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(407188992)))]; tensor query_55_cast_fp16 = conv(bias = layers_13_encoder_attn_q_proj_bias_to_fp16, dilations = var_3089, groups = var_2965, pad = query_55_pad_0, pad_type = query_55_pad_type_0, strides = var_3087, weight = layers_13_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_165_cast_fp16)[name = tensor("query_55_cast_fp16")]; tensor var_3093 = const()[name = tensor("op_3093"), val = tensor([1, 1])]; tensor var_3095 = const()[name = tensor("op_3095"), val = tensor([1, 1])]; tensor key_55_pad_type_0 = const()[name = tensor("key_55_pad_type_0"), val = tensor("custom")]; tensor key_55_pad_0 = const()[name = tensor("key_55_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(407191616))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408010880))), name = tensor("layers_13_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_55_cast_fp16 = conv(dilations = var_3095, groups = var_2965, pad = key_55_pad_0, pad_type = key_55_pad_type_0, strides = var_3093, weight = layers_13_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_55_cast_fp16")]; tensor var_3100 = const()[name = tensor("op_3100"), val = tensor([1, 1])]; tensor var_3102 = const()[name = tensor("op_3102"), val = tensor([1, 1])]; tensor value_55_pad_type_0 = const()[name = tensor("value_55_pad_type_0"), val = tensor("custom")]; tensor value_55_pad_0 = const()[name = tensor("value_55_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408011008))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408830272))), name = tensor("layers_13_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_13_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_13_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408830400)))]; tensor value_55_cast_fp16 = conv(bias = layers_13_encoder_attn_v_proj_bias_to_fp16, dilations = var_3102, groups = var_2965, pad = value_55_pad_0, pad_type = value_55_pad_type_0, strides = var_3100, weight = layers_13_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_55_cast_fp16")]; tensor var_3106 = const()[name = tensor("op_3106"), val = tensor([1, 20, 64, -1])]; tensor var_3107_cast_fp16 = reshape(shape = var_3106, x = query_55_cast_fp16)[name = tensor("op_3107_cast_fp16")]; tensor var_3108_to_fp16 = const()[name = tensor("op_3108_to_fp16"), val = tensor(0x1p-3)]; tensor var_3109_cast_fp16 = mul(x = var_3107_cast_fp16, y = var_3108_to_fp16)[name = tensor("op_3109_cast_fp16")]; tensor var_3110 = const()[name = tensor("op_3110"), val = tensor([1, 20, 64, -1])]; tensor var_3111_cast_fp16 = reshape(shape = var_3110, x = key_55_cast_fp16)[name = tensor("op_3111_cast_fp16")]; tensor mh_w_83_transpose_x_0 = const()[name = tensor("mh_w_83_transpose_x_0"), val = tensor(true)]; tensor mh_w_83_transpose_y_0 = const()[name = tensor("mh_w_83_transpose_y_0"), val = tensor(false)]; tensor mh_w_83_cast_fp16 = matmul(transpose_x = mh_w_83_transpose_x_0, transpose_y = mh_w_83_transpose_y_0, x = var_3109_cast_fp16, y = var_3111_cast_fp16)[name = tensor("mh_w_83_cast_fp16")]; tensor var_3114_cast_fp16 = softmax(axis = var_2958, x = mh_w_83_cast_fp16)[name = tensor("op_3114_cast_fp16")]; tensor var_3115 = const()[name = tensor("op_3115"), val = tensor([1, 20, 64, -1])]; tensor var_3116_cast_fp16 = reshape(shape = var_3115, x = value_55_cast_fp16)[name = tensor("op_3116_cast_fp16")]; tensor attn_55_transpose_x_0 = const()[name = tensor("attn_55_transpose_x_0"), val = tensor(false)]; tensor attn_55_transpose_y_0 = const()[name = tensor("attn_55_transpose_y_0"), val = tensor(true)]; tensor attn_55_cast_fp16 = matmul(transpose_x = attn_55_transpose_x_0, transpose_y = attn_55_transpose_y_0, x = var_3116_cast_fp16, y = var_3114_cast_fp16)[name = tensor("attn_55_cast_fp16")]; tensor var_3119 = const()[name = tensor("op_3119"), val = tensor([1, 1280, 1, -1])]; tensor input_133_cast_fp16 = reshape(shape = var_3119, x = attn_55_cast_fp16)[name = tensor("input_133_cast_fp16")]; tensor var_3123 = const()[name = tensor("op_3123"), val = tensor([1, 1])]; tensor var_3125 = const()[name = tensor("op_3125"), val = tensor([1, 1])]; tensor obj_167_pad_type_0 = const()[name = tensor("obj_167_pad_type_0"), val = tensor("custom")]; tensor obj_167_pad_0 = const()[name = tensor("obj_167_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(408833024))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(409652288))), name = tensor("layers_13_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_13_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_13_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(409652416)))]; tensor obj_167_cast_fp16 = conv(bias = layers_13_encoder_attn_o_proj_bias_to_fp16, dilations = var_3125, groups = var_2965, pad = obj_167_pad_0, pad_type = obj_167_pad_type_0, strides = var_3123, weight = layers_13_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_133_cast_fp16)[name = tensor("obj_167_cast_fp16")]; tensor inputs_83_cast_fp16 = add(x = inputs_81_cast_fp16, y = obj_167_cast_fp16)[name = tensor("inputs_83_cast_fp16")]; tensor var_3131 = const()[name = tensor("op_3131"), val = tensor([1])]; tensor channels_mean_83_cast_fp16 = reduce_mean(axes = var_3131, keep_dims = var_2966, x = inputs_83_cast_fp16)[name = tensor("channels_mean_83_cast_fp16")]; tensor zero_mean_83_cast_fp16 = sub(x = inputs_83_cast_fp16, y = channels_mean_83_cast_fp16)[name = tensor("zero_mean_83_cast_fp16")]; tensor zero_mean_sq_83_cast_fp16 = mul(x = zero_mean_83_cast_fp16, y = zero_mean_83_cast_fp16)[name = tensor("zero_mean_sq_83_cast_fp16")]; tensor var_3135 = const()[name = tensor("op_3135"), val = tensor([1])]; tensor var_3136_cast_fp16 = reduce_mean(axes = var_3135, keep_dims = var_2966, x = zero_mean_sq_83_cast_fp16)[name = tensor("op_3136_cast_fp16")]; tensor var_3137_to_fp16 = const()[name = tensor("op_3137_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3138_cast_fp16 = add(x = var_3136_cast_fp16, y = var_3137_to_fp16)[name = tensor("op_3138_cast_fp16")]; tensor denom_83_epsilon_0 = const()[name = tensor("denom_83_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_83_cast_fp16 = rsqrt(epsilon = denom_83_epsilon_0, x = var_3138_cast_fp16)[name = tensor("denom_83_cast_fp16")]; tensor out_83_cast_fp16 = mul(x = zero_mean_83_cast_fp16, y = denom_83_cast_fp16)[name = tensor("out_83_cast_fp16")]; tensor input_135_gamma_0_to_fp16 = const()[name = tensor("input_135_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(409655040)))]; tensor input_135_beta_0_to_fp16 = const()[name = tensor("input_135_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(409657664)))]; tensor input_135_epsilon_0_to_fp16 = const()[name = tensor("input_135_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_135_cast_fp16 = batch_norm(beta = input_135_beta_0_to_fp16, epsilon = input_135_epsilon_0_to_fp16, gamma = input_135_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_83_cast_fp16)[name = tensor("input_135_cast_fp16")]; tensor var_3149 = const()[name = tensor("op_3149"), val = tensor([1, 1])]; tensor var_3151 = const()[name = tensor("op_3151"), val = tensor([1, 1])]; tensor input_137_pad_type_0 = const()[name = tensor("input_137_pad_type_0"), val = tensor("custom")]; tensor input_137_pad_0 = const()[name = tensor("input_137_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(409660288))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(414575552))), name = tensor("layers_13_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_13_fc1_bias_to_fp16 = const()[name = tensor("layers_13_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(414575744)))]; tensor input_137_cast_fp16 = conv(bias = layers_13_fc1_bias_to_fp16, dilations = var_3151, groups = var_2965, pad = input_137_pad_0, pad_type = input_137_pad_type_0, strides = var_3149, weight = layers_13_fc1_weight_to_fp16_palettized, x = input_135_cast_fp16)[name = tensor("input_137_cast_fp16")]; tensor input_139_mode_0 = const()[name = tensor("input_139_mode_0"), val = tensor("EXACT")]; tensor input_139_cast_fp16 = gelu(mode = input_139_mode_0, x = input_137_cast_fp16)[name = tensor("input_139_cast_fp16")]; tensor var_3157 = const()[name = tensor("op_3157"), val = tensor([1, 1])]; tensor var_3159 = const()[name = tensor("op_3159"), val = tensor([1, 1])]; tensor hidden_states_29_pad_type_0 = const()[name = tensor("hidden_states_29_pad_type_0"), val = tensor("custom")]; tensor hidden_states_29_pad_0 = const()[name = tensor("hidden_states_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_13_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(414586048))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419501312))), name = tensor("layers_13_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_13_fc2_bias_to_fp16 = const()[name = tensor("layers_13_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419501504)))]; tensor hidden_states_29_cast_fp16 = conv(bias = layers_13_fc2_bias_to_fp16, dilations = var_3159, groups = var_2965, pad = hidden_states_29_pad_0, pad_type = hidden_states_29_pad_type_0, strides = var_3157, weight = layers_13_fc2_weight_to_fp16_palettized, x = input_139_cast_fp16)[name = tensor("hidden_states_29_cast_fp16")]; tensor inputs_85_cast_fp16 = add(x = inputs_83_cast_fp16, y = hidden_states_29_cast_fp16)[name = tensor("inputs_85_cast_fp16")]; tensor var_3172 = const()[name = tensor("op_3172"), val = tensor(3)]; tensor var_3179 = const()[name = tensor("op_3179"), val = tensor(1)]; tensor var_3180 = const()[name = tensor("op_3180"), val = tensor(true)]; tensor var_3192 = const()[name = tensor("op_3192"), val = tensor([1])]; tensor channels_mean_85_cast_fp16 = reduce_mean(axes = var_3192, keep_dims = var_3180, x = inputs_85_cast_fp16)[name = tensor("channels_mean_85_cast_fp16")]; tensor zero_mean_85_cast_fp16 = sub(x = inputs_85_cast_fp16, y = channels_mean_85_cast_fp16)[name = tensor("zero_mean_85_cast_fp16")]; tensor zero_mean_sq_85_cast_fp16 = mul(x = zero_mean_85_cast_fp16, y = zero_mean_85_cast_fp16)[name = tensor("zero_mean_sq_85_cast_fp16")]; tensor var_3196 = const()[name = tensor("op_3196"), val = tensor([1])]; tensor var_3197_cast_fp16 = reduce_mean(axes = var_3196, keep_dims = var_3180, x = zero_mean_sq_85_cast_fp16)[name = tensor("op_3197_cast_fp16")]; tensor var_3198_to_fp16 = const()[name = tensor("op_3198_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3199_cast_fp16 = add(x = var_3197_cast_fp16, y = var_3198_to_fp16)[name = tensor("op_3199_cast_fp16")]; tensor denom_85_epsilon_0 = const()[name = tensor("denom_85_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_85_cast_fp16 = rsqrt(epsilon = denom_85_epsilon_0, x = var_3199_cast_fp16)[name = tensor("denom_85_cast_fp16")]; tensor out_85_cast_fp16 = mul(x = zero_mean_85_cast_fp16, y = denom_85_cast_fp16)[name = tensor("out_85_cast_fp16")]; tensor obj_169_gamma_0_to_fp16 = const()[name = tensor("obj_169_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419504128)))]; tensor obj_169_beta_0_to_fp16 = const()[name = tensor("obj_169_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419506752)))]; tensor obj_169_epsilon_0_to_fp16 = const()[name = tensor("obj_169_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_169_cast_fp16 = batch_norm(beta = obj_169_beta_0_to_fp16, epsilon = obj_169_epsilon_0_to_fp16, gamma = obj_169_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_85_cast_fp16)[name = tensor("obj_169_cast_fp16")]; tensor var_3214 = const()[name = tensor("op_3214"), val = tensor([1, 1])]; tensor var_3216 = const()[name = tensor("op_3216"), val = tensor([1, 1])]; tensor query_57_pad_type_0 = const()[name = tensor("query_57_pad_type_0"), val = tensor("custom")]; tensor query_57_pad_0 = const()[name = tensor("query_57_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419509376))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(420738240))), name = tensor("layers_14_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_14_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_14_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(420738432)))]; tensor query_57_cast_fp16 = conv(bias = layers_14_self_attn_q_proj_bias_to_fp16, dilations = var_3216, groups = var_3179, pad = query_57_pad_0, pad_type = query_57_pad_type_0, strides = var_3214, weight = layers_14_self_attn_q_proj_weight_to_fp16_palettized, x = obj_169_cast_fp16)[name = tensor("query_57_cast_fp16")]; tensor var_3220 = const()[name = tensor("op_3220"), val = tensor([1, 1])]; tensor var_3222 = const()[name = tensor("op_3222"), val = tensor([1, 1])]; tensor current_key_29_pad_type_0 = const()[name = tensor("current_key_29_pad_type_0"), val = tensor("custom")]; tensor current_key_29_pad_0 = const()[name = tensor("current_key_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(420741056))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421969920))), name = tensor("layers_14_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_29_cast_fp16 = conv(dilations = var_3222, groups = var_3179, pad = current_key_29_pad_0, pad_type = current_key_29_pad_type_0, strides = var_3220, weight = layers_14_self_attn_k_proj_weight_to_fp16_palettized, x = obj_169_cast_fp16)[name = tensor("current_key_29_cast_fp16")]; tensor var_3227 = const()[name = tensor("op_3227"), val = tensor([1, 1])]; tensor var_3229 = const()[name = tensor("op_3229"), val = tensor([1, 1])]; tensor current_value_29_pad_type_0 = const()[name = tensor("current_value_29_pad_type_0"), val = tensor("custom")]; tensor current_value_29_pad_0 = const()[name = tensor("current_value_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421970112))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(422789376))), name = tensor("layers_14_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_14_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_14_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(422789504)))]; tensor current_value_29_cast_fp16 = conv(bias = layers_14_self_attn_v_proj_bias_to_fp16, dilations = var_3229, groups = var_3179, pad = current_value_29_pad_0, pad_type = current_value_29_pad_type_0, strides = var_3227, weight = layers_14_self_attn_v_proj_weight_to_fp16_palettized, x = obj_169_cast_fp16)[name = tensor("current_value_29_cast_fp16")]; tensor var_3236_cast_fp16 = mul(x = current_key_29_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3236_cast_fp16")]; tensor var_3238_cast_fp16 = mul(x = var_103_cast_fp16_14, y = var_241_cast_fp16)[name = tensor("op_3238_cast_fp16")]; tensor key_57_cast_fp16 = add(x = var_3236_cast_fp16, y = var_3238_cast_fp16)[name = tensor("key_57_cast_fp16")]; tensor var_3240_cast_fp16 = mul(x = current_value_29_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3240_cast_fp16")]; tensor var_3242_cast_fp16 = mul(x = var_138_cast_fp16_14, y = var_241_cast_fp16)[name = tensor("op_3242_cast_fp16")]; tensor value_57_cast_fp16 = add(x = var_3240_cast_fp16, y = var_3242_cast_fp16)[name = tensor("value_57_cast_fp16")]; tensor var_3245 = const()[name = tensor("op_3245"), val = tensor([1, 20, 64, -1])]; tensor var_3246_cast_fp16 = reshape(shape = var_3245, x = query_57_cast_fp16)[name = tensor("op_3246_cast_fp16")]; tensor var_3247_to_fp16 = const()[name = tensor("op_3247_to_fp16"), val = tensor(0x1p-3)]; tensor var_3248_cast_fp16 = mul(x = var_3246_cast_fp16, y = var_3247_to_fp16)[name = tensor("op_3248_cast_fp16")]; tensor var_3249 = const()[name = tensor("op_3249"), val = tensor([1, 20, 64, -1])]; tensor var_3250_cast_fp16 = reshape(shape = var_3249, x = key_57_cast_fp16)[name = tensor("op_3250_cast_fp16")]; tensor mh_w_85_transpose_x_0 = const()[name = tensor("mh_w_85_transpose_x_0"), val = tensor(true)]; tensor mh_w_85_transpose_y_0 = const()[name = tensor("mh_w_85_transpose_y_0"), val = tensor(false)]; tensor mh_w_85_cast_fp16 = matmul(transpose_x = mh_w_85_transpose_x_0, transpose_y = mh_w_85_transpose_y_0, x = var_3248_cast_fp16, y = var_3250_cast_fp16)[name = tensor("mh_w_85_cast_fp16")]; tensor mh_w_87_cast_fp16 = add(x = mh_w_85_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_87_cast_fp16")]; tensor var_3258_cast_fp16 = softmax(axis = var_3172, x = mh_w_87_cast_fp16)[name = tensor("op_3258_cast_fp16")]; tensor var_3259 = const()[name = tensor("op_3259"), val = tensor([1, 20, 64, -1])]; tensor var_3260_cast_fp16 = reshape(shape = var_3259, x = value_57_cast_fp16)[name = tensor("op_3260_cast_fp16")]; tensor attn_57_transpose_x_0 = const()[name = tensor("attn_57_transpose_x_0"), val = tensor(false)]; tensor attn_57_transpose_y_0 = const()[name = tensor("attn_57_transpose_y_0"), val = tensor(true)]; tensor attn_57_cast_fp16 = matmul(transpose_x = attn_57_transpose_x_0, transpose_y = attn_57_transpose_y_0, x = var_3260_cast_fp16, y = var_3258_cast_fp16)[name = tensor("attn_57_cast_fp16")]; tensor var_3263 = const()[name = tensor("op_3263"), val = tensor([1, 1280, 1, -1])]; tensor input_141_cast_fp16 = reshape(shape = var_3263, x = attn_57_cast_fp16)[name = tensor("input_141_cast_fp16")]; tensor var_3267 = const()[name = tensor("op_3267"), val = tensor([1, 1])]; tensor var_3269 = const()[name = tensor("op_3269"), val = tensor([1, 1])]; tensor obj_175_pad_type_0 = const()[name = tensor("obj_175_pad_type_0"), val = tensor("custom")]; tensor obj_175_pad_0 = const()[name = tensor("obj_175_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(422792128))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(423611392))), name = tensor("layers_14_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_14_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_14_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(423611520)))]; tensor obj_175_cast_fp16 = conv(bias = layers_14_self_attn_o_proj_bias_to_fp16, dilations = var_3269, groups = var_3179, pad = obj_175_pad_0, pad_type = obj_175_pad_type_0, strides = var_3267, weight = layers_14_self_attn_o_proj_weight_to_fp16_palettized, x = input_141_cast_fp16)[name = tensor("obj_175_cast_fp16")]; tensor inputs_87_cast_fp16 = add(x = inputs_85_cast_fp16, y = obj_175_cast_fp16)[name = tensor("inputs_87_cast_fp16")]; tensor var_3279 = const()[name = tensor("op_3279"), val = tensor([1])]; tensor channels_mean_87_cast_fp16 = reduce_mean(axes = var_3279, keep_dims = var_3180, x = inputs_87_cast_fp16)[name = tensor("channels_mean_87_cast_fp16")]; tensor zero_mean_87_cast_fp16 = sub(x = inputs_87_cast_fp16, y = channels_mean_87_cast_fp16)[name = tensor("zero_mean_87_cast_fp16")]; tensor zero_mean_sq_87_cast_fp16 = mul(x = zero_mean_87_cast_fp16, y = zero_mean_87_cast_fp16)[name = tensor("zero_mean_sq_87_cast_fp16")]; tensor var_3283 = const()[name = tensor("op_3283"), val = tensor([1])]; tensor var_3284_cast_fp16 = reduce_mean(axes = var_3283, keep_dims = var_3180, x = zero_mean_sq_87_cast_fp16)[name = tensor("op_3284_cast_fp16")]; tensor var_3285_to_fp16 = const()[name = tensor("op_3285_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3286_cast_fp16 = add(x = var_3284_cast_fp16, y = var_3285_to_fp16)[name = tensor("op_3286_cast_fp16")]; tensor denom_87_epsilon_0 = const()[name = tensor("denom_87_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_87_cast_fp16 = rsqrt(epsilon = denom_87_epsilon_0, x = var_3286_cast_fp16)[name = tensor("denom_87_cast_fp16")]; tensor out_87_cast_fp16 = mul(x = zero_mean_87_cast_fp16, y = denom_87_cast_fp16)[name = tensor("out_87_cast_fp16")]; tensor obj_177_gamma_0_to_fp16 = const()[name = tensor("obj_177_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(423614144)))]; tensor obj_177_beta_0_to_fp16 = const()[name = tensor("obj_177_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(423616768)))]; tensor obj_177_epsilon_0_to_fp16 = const()[name = tensor("obj_177_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_177_cast_fp16 = batch_norm(beta = obj_177_beta_0_to_fp16, epsilon = obj_177_epsilon_0_to_fp16, gamma = obj_177_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_87_cast_fp16)[name = tensor("obj_177_cast_fp16")]; tensor var_3301 = const()[name = tensor("op_3301"), val = tensor([1, 1])]; tensor var_3303 = const()[name = tensor("op_3303"), val = tensor([1, 1])]; tensor query_59_pad_type_0 = const()[name = tensor("query_59_pad_type_0"), val = tensor("custom")]; tensor query_59_pad_0 = const()[name = tensor("query_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(423619392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(424848256))), name = tensor("layers_14_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_14_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_14_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(424848448)))]; tensor query_59_cast_fp16 = conv(bias = layers_14_encoder_attn_q_proj_bias_to_fp16, dilations = var_3303, groups = var_3179, pad = query_59_pad_0, pad_type = query_59_pad_type_0, strides = var_3301, weight = layers_14_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_177_cast_fp16)[name = tensor("query_59_cast_fp16")]; tensor var_3307 = const()[name = tensor("op_3307"), val = tensor([1, 1])]; tensor var_3309 = const()[name = tensor("op_3309"), val = tensor([1, 1])]; tensor key_59_pad_type_0 = const()[name = tensor("key_59_pad_type_0"), val = tensor("custom")]; tensor key_59_pad_0 = const()[name = tensor("key_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(424851072))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(425670336))), name = tensor("layers_14_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_59_cast_fp16 = conv(dilations = var_3309, groups = var_3179, pad = key_59_pad_0, pad_type = key_59_pad_type_0, strides = var_3307, weight = layers_14_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_59_cast_fp16")]; tensor var_3314 = const()[name = tensor("op_3314"), val = tensor([1, 1])]; tensor var_3316 = const()[name = tensor("op_3316"), val = tensor([1, 1])]; tensor value_59_pad_type_0 = const()[name = tensor("value_59_pad_type_0"), val = tensor("custom")]; tensor value_59_pad_0 = const()[name = tensor("value_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(425670464))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(426489728))), name = tensor("layers_14_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_14_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_14_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(426489856)))]; tensor value_59_cast_fp16 = conv(bias = layers_14_encoder_attn_v_proj_bias_to_fp16, dilations = var_3316, groups = var_3179, pad = value_59_pad_0, pad_type = value_59_pad_type_0, strides = var_3314, weight = layers_14_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_59_cast_fp16")]; tensor var_3320 = const()[name = tensor("op_3320"), val = tensor([1, 20, 64, -1])]; tensor var_3321_cast_fp16 = reshape(shape = var_3320, x = query_59_cast_fp16)[name = tensor("op_3321_cast_fp16")]; tensor var_3322_to_fp16 = const()[name = tensor("op_3322_to_fp16"), val = tensor(0x1p-3)]; tensor var_3323_cast_fp16 = mul(x = var_3321_cast_fp16, y = var_3322_to_fp16)[name = tensor("op_3323_cast_fp16")]; tensor var_3324 = const()[name = tensor("op_3324"), val = tensor([1, 20, 64, -1])]; tensor var_3325_cast_fp16 = reshape(shape = var_3324, x = key_59_cast_fp16)[name = tensor("op_3325_cast_fp16")]; tensor mh_w_89_transpose_x_0 = const()[name = tensor("mh_w_89_transpose_x_0"), val = tensor(true)]; tensor mh_w_89_transpose_y_0 = const()[name = tensor("mh_w_89_transpose_y_0"), val = tensor(false)]; tensor mh_w_89_cast_fp16 = matmul(transpose_x = mh_w_89_transpose_x_0, transpose_y = mh_w_89_transpose_y_0, x = var_3323_cast_fp16, y = var_3325_cast_fp16)[name = tensor("mh_w_89_cast_fp16")]; tensor var_3328_cast_fp16 = softmax(axis = var_3172, x = mh_w_89_cast_fp16)[name = tensor("op_3328_cast_fp16")]; tensor var_3329 = const()[name = tensor("op_3329"), val = tensor([1, 20, 64, -1])]; tensor var_3330_cast_fp16 = reshape(shape = var_3329, x = value_59_cast_fp16)[name = tensor("op_3330_cast_fp16")]; tensor attn_59_transpose_x_0 = const()[name = tensor("attn_59_transpose_x_0"), val = tensor(false)]; tensor attn_59_transpose_y_0 = const()[name = tensor("attn_59_transpose_y_0"), val = tensor(true)]; tensor attn_59_cast_fp16 = matmul(transpose_x = attn_59_transpose_x_0, transpose_y = attn_59_transpose_y_0, x = var_3330_cast_fp16, y = var_3328_cast_fp16)[name = tensor("attn_59_cast_fp16")]; tensor var_3333 = const()[name = tensor("op_3333"), val = tensor([1, 1280, 1, -1])]; tensor input_143_cast_fp16 = reshape(shape = var_3333, x = attn_59_cast_fp16)[name = tensor("input_143_cast_fp16")]; tensor var_3337 = const()[name = tensor("op_3337"), val = tensor([1, 1])]; tensor var_3339 = const()[name = tensor("op_3339"), val = tensor([1, 1])]; tensor obj_179_pad_type_0 = const()[name = tensor("obj_179_pad_type_0"), val = tensor("custom")]; tensor obj_179_pad_0 = const()[name = tensor("obj_179_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(426492480))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(427721344))), name = tensor("layers_14_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_14_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_14_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(427721536)))]; tensor obj_179_cast_fp16 = conv(bias = layers_14_encoder_attn_o_proj_bias_to_fp16, dilations = var_3339, groups = var_3179, pad = obj_179_pad_0, pad_type = obj_179_pad_type_0, strides = var_3337, weight = layers_14_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_143_cast_fp16)[name = tensor("obj_179_cast_fp16")]; tensor inputs_89_cast_fp16 = add(x = inputs_87_cast_fp16, y = obj_179_cast_fp16)[name = tensor("inputs_89_cast_fp16")]; tensor var_3345 = const()[name = tensor("op_3345"), val = tensor([1])]; tensor channels_mean_89_cast_fp16 = reduce_mean(axes = var_3345, keep_dims = var_3180, x = inputs_89_cast_fp16)[name = tensor("channels_mean_89_cast_fp16")]; tensor zero_mean_89_cast_fp16 = sub(x = inputs_89_cast_fp16, y = channels_mean_89_cast_fp16)[name = tensor("zero_mean_89_cast_fp16")]; tensor zero_mean_sq_89_cast_fp16 = mul(x = zero_mean_89_cast_fp16, y = zero_mean_89_cast_fp16)[name = tensor("zero_mean_sq_89_cast_fp16")]; tensor var_3349 = const()[name = tensor("op_3349"), val = tensor([1])]; tensor var_3350_cast_fp16 = reduce_mean(axes = var_3349, keep_dims = var_3180, x = zero_mean_sq_89_cast_fp16)[name = tensor("op_3350_cast_fp16")]; tensor var_3351_to_fp16 = const()[name = tensor("op_3351_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3352_cast_fp16 = add(x = var_3350_cast_fp16, y = var_3351_to_fp16)[name = tensor("op_3352_cast_fp16")]; tensor denom_89_epsilon_0 = const()[name = tensor("denom_89_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_89_cast_fp16 = rsqrt(epsilon = denom_89_epsilon_0, x = var_3352_cast_fp16)[name = tensor("denom_89_cast_fp16")]; tensor out_89_cast_fp16 = mul(x = zero_mean_89_cast_fp16, y = denom_89_cast_fp16)[name = tensor("out_89_cast_fp16")]; tensor input_145_gamma_0_to_fp16 = const()[name = tensor("input_145_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(427724160)))]; tensor input_145_beta_0_to_fp16 = const()[name = tensor("input_145_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(427726784)))]; tensor input_145_epsilon_0_to_fp16 = const()[name = tensor("input_145_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_145_cast_fp16 = batch_norm(beta = input_145_beta_0_to_fp16, epsilon = input_145_epsilon_0_to_fp16, gamma = input_145_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_89_cast_fp16)[name = tensor("input_145_cast_fp16")]; tensor var_3363 = const()[name = tensor("op_3363"), val = tensor([1, 1])]; tensor var_3365 = const()[name = tensor("op_3365"), val = tensor([1, 1])]; tensor input_147_pad_type_0 = const()[name = tensor("input_147_pad_type_0"), val = tensor("custom")]; tensor input_147_pad_0 = const()[name = tensor("input_147_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(427729408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(432644672))), name = tensor("layers_14_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_14_fc1_bias_to_fp16 = const()[name = tensor("layers_14_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(432644864)))]; tensor input_147_cast_fp16 = conv(bias = layers_14_fc1_bias_to_fp16, dilations = var_3365, groups = var_3179, pad = input_147_pad_0, pad_type = input_147_pad_type_0, strides = var_3363, weight = layers_14_fc1_weight_to_fp16_palettized, x = input_145_cast_fp16)[name = tensor("input_147_cast_fp16")]; tensor input_149_mode_0 = const()[name = tensor("input_149_mode_0"), val = tensor("EXACT")]; tensor input_149_cast_fp16 = gelu(mode = input_149_mode_0, x = input_147_cast_fp16)[name = tensor("input_149_cast_fp16")]; tensor var_3371 = const()[name = tensor("op_3371"), val = tensor([1, 1])]; tensor var_3373 = const()[name = tensor("op_3373"), val = tensor([1, 1])]; tensor hidden_states_31_pad_type_0 = const()[name = tensor("hidden_states_31_pad_type_0"), val = tensor("custom")]; tensor hidden_states_31_pad_0 = const()[name = tensor("hidden_states_31_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_14_fc2_weight_to_fp16 = const()[name = tensor("layers_14_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(432655168)))]; tensor layers_14_fc2_bias_to_fp16 = const()[name = tensor("layers_14_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445762432)))]; tensor hidden_states_31_cast_fp16 = conv(bias = layers_14_fc2_bias_to_fp16, dilations = var_3373, groups = var_3179, pad = hidden_states_31_pad_0, pad_type = hidden_states_31_pad_type_0, strides = var_3371, weight = layers_14_fc2_weight_to_fp16, x = input_149_cast_fp16)[name = tensor("hidden_states_31_cast_fp16")]; tensor inputs_91_cast_fp16 = add(x = inputs_89_cast_fp16, y = hidden_states_31_cast_fp16)[name = tensor("inputs_91_cast_fp16")]; tensor var_3386 = const()[name = tensor("op_3386"), val = tensor(3)]; tensor var_3393 = const()[name = tensor("op_3393"), val = tensor(1)]; tensor var_3394 = const()[name = tensor("op_3394"), val = tensor(true)]; tensor var_3406 = const()[name = tensor("op_3406"), val = tensor([1])]; tensor channels_mean_91_cast_fp16 = reduce_mean(axes = var_3406, keep_dims = var_3394, x = inputs_91_cast_fp16)[name = tensor("channels_mean_91_cast_fp16")]; tensor zero_mean_91_cast_fp16 = sub(x = inputs_91_cast_fp16, y = channels_mean_91_cast_fp16)[name = tensor("zero_mean_91_cast_fp16")]; tensor zero_mean_sq_91_cast_fp16 = mul(x = zero_mean_91_cast_fp16, y = zero_mean_91_cast_fp16)[name = tensor("zero_mean_sq_91_cast_fp16")]; tensor var_3410 = const()[name = tensor("op_3410"), val = tensor([1])]; tensor var_3411_cast_fp16 = reduce_mean(axes = var_3410, keep_dims = var_3394, x = zero_mean_sq_91_cast_fp16)[name = tensor("op_3411_cast_fp16")]; tensor var_3412_to_fp16 = const()[name = tensor("op_3412_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3413_cast_fp16 = add(x = var_3411_cast_fp16, y = var_3412_to_fp16)[name = tensor("op_3413_cast_fp16")]; tensor denom_91_epsilon_0 = const()[name = tensor("denom_91_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_91_cast_fp16 = rsqrt(epsilon = denom_91_epsilon_0, x = var_3413_cast_fp16)[name = tensor("denom_91_cast_fp16")]; tensor out_91_cast_fp16 = mul(x = zero_mean_91_cast_fp16, y = denom_91_cast_fp16)[name = tensor("out_91_cast_fp16")]; tensor obj_181_gamma_0_to_fp16 = const()[name = tensor("obj_181_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445765056)))]; tensor obj_181_beta_0_to_fp16 = const()[name = tensor("obj_181_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445767680)))]; tensor obj_181_epsilon_0_to_fp16 = const()[name = tensor("obj_181_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_181_cast_fp16 = batch_norm(beta = obj_181_beta_0_to_fp16, epsilon = obj_181_epsilon_0_to_fp16, gamma = obj_181_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_91_cast_fp16)[name = tensor("obj_181_cast_fp16")]; tensor var_3428 = const()[name = tensor("op_3428"), val = tensor([1, 1])]; tensor var_3430 = const()[name = tensor("op_3430"), val = tensor([1, 1])]; tensor query_61_pad_type_0 = const()[name = tensor("query_61_pad_type_0"), val = tensor("custom")]; tensor query_61_pad_0 = const()[name = tensor("query_61_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445770304))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446999168))), name = tensor("layers_15_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_15_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_15_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446999360)))]; tensor query_61_cast_fp16 = conv(bias = layers_15_self_attn_q_proj_bias_to_fp16, dilations = var_3430, groups = var_3393, pad = query_61_pad_0, pad_type = query_61_pad_type_0, strides = var_3428, weight = layers_15_self_attn_q_proj_weight_to_fp16_palettized, x = obj_181_cast_fp16)[name = tensor("query_61_cast_fp16")]; tensor var_3434 = const()[name = tensor("op_3434"), val = tensor([1, 1])]; tensor var_3436 = const()[name = tensor("op_3436"), val = tensor([1, 1])]; tensor current_key_31_pad_type_0 = const()[name = tensor("current_key_31_pad_type_0"), val = tensor("custom")]; tensor current_key_31_pad_0 = const()[name = tensor("current_key_31_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447001984))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447821248))), name = tensor("layers_15_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_31_cast_fp16 = conv(dilations = var_3436, groups = var_3393, pad = current_key_31_pad_0, pad_type = current_key_31_pad_type_0, strides = var_3434, weight = layers_15_self_attn_k_proj_weight_to_fp16_palettized, x = obj_181_cast_fp16)[name = tensor("current_key_31_cast_fp16")]; tensor var_3441 = const()[name = tensor("op_3441"), val = tensor([1, 1])]; tensor var_3443 = const()[name = tensor("op_3443"), val = tensor([1, 1])]; tensor current_value_31_pad_type_0 = const()[name = tensor("current_value_31_pad_type_0"), val = tensor("custom")]; tensor current_value_31_pad_0 = const()[name = tensor("current_value_31_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(447821376))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448640640))), name = tensor("layers_15_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_15_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_15_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448640768)))]; tensor current_value_31_cast_fp16 = conv(bias = layers_15_self_attn_v_proj_bias_to_fp16, dilations = var_3443, groups = var_3393, pad = current_value_31_pad_0, pad_type = current_value_31_pad_type_0, strides = var_3441, weight = layers_15_self_attn_v_proj_weight_to_fp16_palettized, x = obj_181_cast_fp16)[name = tensor("current_value_31_cast_fp16")]; tensor var_3450_cast_fp16 = mul(x = current_key_31_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3450_cast_fp16")]; tensor var_3452_cast_fp16 = mul(x = var_103_cast_fp16_15, y = var_241_cast_fp16)[name = tensor("op_3452_cast_fp16")]; tensor key_61_cast_fp16 = add(x = var_3450_cast_fp16, y = var_3452_cast_fp16)[name = tensor("key_61_cast_fp16")]; tensor var_3454_cast_fp16 = mul(x = current_value_31_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3454_cast_fp16")]; tensor var_3456_cast_fp16 = mul(x = var_138_cast_fp16_15, y = var_241_cast_fp16)[name = tensor("op_3456_cast_fp16")]; tensor value_61_cast_fp16 = add(x = var_3454_cast_fp16, y = var_3456_cast_fp16)[name = tensor("value_61_cast_fp16")]; tensor var_3459 = const()[name = tensor("op_3459"), val = tensor([1, 20, 64, -1])]; tensor var_3460_cast_fp16 = reshape(shape = var_3459, x = query_61_cast_fp16)[name = tensor("op_3460_cast_fp16")]; tensor var_3461_to_fp16 = const()[name = tensor("op_3461_to_fp16"), val = tensor(0x1p-3)]; tensor var_3462_cast_fp16 = mul(x = var_3460_cast_fp16, y = var_3461_to_fp16)[name = tensor("op_3462_cast_fp16")]; tensor var_3463 = const()[name = tensor("op_3463"), val = tensor([1, 20, 64, -1])]; tensor var_3464_cast_fp16 = reshape(shape = var_3463, x = key_61_cast_fp16)[name = tensor("op_3464_cast_fp16")]; tensor mh_w_91_transpose_x_0 = const()[name = tensor("mh_w_91_transpose_x_0"), val = tensor(true)]; tensor mh_w_91_transpose_y_0 = const()[name = tensor("mh_w_91_transpose_y_0"), val = tensor(false)]; tensor mh_w_91_cast_fp16 = matmul(transpose_x = mh_w_91_transpose_x_0, transpose_y = mh_w_91_transpose_y_0, x = var_3462_cast_fp16, y = var_3464_cast_fp16)[name = tensor("mh_w_91_cast_fp16")]; tensor mh_w_93_cast_fp16 = add(x = mh_w_91_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_93_cast_fp16")]; tensor var_3472_cast_fp16 = softmax(axis = var_3386, x = mh_w_93_cast_fp16)[name = tensor("op_3472_cast_fp16")]; tensor var_3473 = const()[name = tensor("op_3473"), val = tensor([1, 20, 64, -1])]; tensor var_3474_cast_fp16 = reshape(shape = var_3473, x = value_61_cast_fp16)[name = tensor("op_3474_cast_fp16")]; tensor attn_61_transpose_x_0 = const()[name = tensor("attn_61_transpose_x_0"), val = tensor(false)]; tensor attn_61_transpose_y_0 = const()[name = tensor("attn_61_transpose_y_0"), val = tensor(true)]; tensor attn_61_cast_fp16 = matmul(transpose_x = attn_61_transpose_x_0, transpose_y = attn_61_transpose_y_0, x = var_3474_cast_fp16, y = var_3472_cast_fp16)[name = tensor("attn_61_cast_fp16")]; tensor var_3477 = const()[name = tensor("op_3477"), val = tensor([1, 1280, 1, -1])]; tensor input_151_cast_fp16 = reshape(shape = var_3477, x = attn_61_cast_fp16)[name = tensor("input_151_cast_fp16")]; tensor var_3481 = const()[name = tensor("op_3481"), val = tensor([1, 1])]; tensor var_3483 = const()[name = tensor("op_3483"), val = tensor([1, 1])]; tensor obj_187_pad_type_0 = const()[name = tensor("obj_187_pad_type_0"), val = tensor("custom")]; tensor obj_187_pad_0 = const()[name = tensor("obj_187_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448643392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(449872256))), name = tensor("layers_15_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_15_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_15_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(449872448)))]; tensor obj_187_cast_fp16 = conv(bias = layers_15_self_attn_o_proj_bias_to_fp16, dilations = var_3483, groups = var_3393, pad = obj_187_pad_0, pad_type = obj_187_pad_type_0, strides = var_3481, weight = layers_15_self_attn_o_proj_weight_to_fp16_palettized, x = input_151_cast_fp16)[name = tensor("obj_187_cast_fp16")]; tensor inputs_93_cast_fp16 = add(x = inputs_91_cast_fp16, y = obj_187_cast_fp16)[name = tensor("inputs_93_cast_fp16")]; tensor var_3493 = const()[name = tensor("op_3493"), val = tensor([1])]; tensor channels_mean_93_cast_fp16 = reduce_mean(axes = var_3493, keep_dims = var_3394, x = inputs_93_cast_fp16)[name = tensor("channels_mean_93_cast_fp16")]; tensor zero_mean_93_cast_fp16 = sub(x = inputs_93_cast_fp16, y = channels_mean_93_cast_fp16)[name = tensor("zero_mean_93_cast_fp16")]; tensor zero_mean_sq_93_cast_fp16 = mul(x = zero_mean_93_cast_fp16, y = zero_mean_93_cast_fp16)[name = tensor("zero_mean_sq_93_cast_fp16")]; tensor var_3497 = const()[name = tensor("op_3497"), val = tensor([1])]; tensor var_3498_cast_fp16 = reduce_mean(axes = var_3497, keep_dims = var_3394, x = zero_mean_sq_93_cast_fp16)[name = tensor("op_3498_cast_fp16")]; tensor var_3499_to_fp16 = const()[name = tensor("op_3499_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3500_cast_fp16 = add(x = var_3498_cast_fp16, y = var_3499_to_fp16)[name = tensor("op_3500_cast_fp16")]; tensor denom_93_epsilon_0 = const()[name = tensor("denom_93_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_93_cast_fp16 = rsqrt(epsilon = denom_93_epsilon_0, x = var_3500_cast_fp16)[name = tensor("denom_93_cast_fp16")]; tensor out_93_cast_fp16 = mul(x = zero_mean_93_cast_fp16, y = denom_93_cast_fp16)[name = tensor("out_93_cast_fp16")]; tensor obj_189_gamma_0_to_fp16 = const()[name = tensor("obj_189_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(449875072)))]; tensor obj_189_beta_0_to_fp16 = const()[name = tensor("obj_189_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(449877696)))]; tensor obj_189_epsilon_0_to_fp16 = const()[name = tensor("obj_189_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_189_cast_fp16 = batch_norm(beta = obj_189_beta_0_to_fp16, epsilon = obj_189_epsilon_0_to_fp16, gamma = obj_189_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_93_cast_fp16)[name = tensor("obj_189_cast_fp16")]; tensor var_3515 = const()[name = tensor("op_3515"), val = tensor([1, 1])]; tensor var_3517 = const()[name = tensor("op_3517"), val = tensor([1, 1])]; tensor query_63_pad_type_0 = const()[name = tensor("query_63_pad_type_0"), val = tensor("custom")]; tensor query_63_pad_0 = const()[name = tensor("query_63_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(449880320))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(451109184))), name = tensor("layers_15_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_15_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_15_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(451109376)))]; tensor query_63_cast_fp16 = conv(bias = layers_15_encoder_attn_q_proj_bias_to_fp16, dilations = var_3517, groups = var_3393, pad = query_63_pad_0, pad_type = query_63_pad_type_0, strides = var_3515, weight = layers_15_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_189_cast_fp16)[name = tensor("query_63_cast_fp16")]; tensor var_3521 = const()[name = tensor("op_3521"), val = tensor([1, 1])]; tensor var_3523 = const()[name = tensor("op_3523"), val = tensor([1, 1])]; tensor key_63_pad_type_0 = const()[name = tensor("key_63_pad_type_0"), val = tensor("custom")]; tensor key_63_pad_0 = const()[name = tensor("key_63_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(451112000))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(452340864))), name = tensor("layers_15_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_63_cast_fp16 = conv(dilations = var_3523, groups = var_3393, pad = key_63_pad_0, pad_type = key_63_pad_type_0, strides = var_3521, weight = layers_15_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_63_cast_fp16")]; tensor var_3528 = const()[name = tensor("op_3528"), val = tensor([1, 1])]; tensor var_3530 = const()[name = tensor("op_3530"), val = tensor([1, 1])]; tensor value_63_pad_type_0 = const()[name = tensor("value_63_pad_type_0"), val = tensor("custom")]; tensor value_63_pad_0 = const()[name = tensor("value_63_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(452341056))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(453569920))), name = tensor("layers_15_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_15_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_15_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(453570112)))]; tensor value_63_cast_fp16 = conv(bias = layers_15_encoder_attn_v_proj_bias_to_fp16, dilations = var_3530, groups = var_3393, pad = value_63_pad_0, pad_type = value_63_pad_type_0, strides = var_3528, weight = layers_15_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_63_cast_fp16")]; tensor var_3534 = const()[name = tensor("op_3534"), val = tensor([1, 20, 64, -1])]; tensor var_3535_cast_fp16 = reshape(shape = var_3534, x = query_63_cast_fp16)[name = tensor("op_3535_cast_fp16")]; tensor var_3536_to_fp16 = const()[name = tensor("op_3536_to_fp16"), val = tensor(0x1p-3)]; tensor var_3537_cast_fp16 = mul(x = var_3535_cast_fp16, y = var_3536_to_fp16)[name = tensor("op_3537_cast_fp16")]; tensor var_3538 = const()[name = tensor("op_3538"), val = tensor([1, 20, 64, -1])]; tensor var_3539_cast_fp16 = reshape(shape = var_3538, x = key_63_cast_fp16)[name = tensor("op_3539_cast_fp16")]; tensor mh_w_95_transpose_x_0 = const()[name = tensor("mh_w_95_transpose_x_0"), val = tensor(true)]; tensor mh_w_95_transpose_y_0 = const()[name = tensor("mh_w_95_transpose_y_0"), val = tensor(false)]; tensor mh_w_95_cast_fp16 = matmul(transpose_x = mh_w_95_transpose_x_0, transpose_y = mh_w_95_transpose_y_0, x = var_3537_cast_fp16, y = var_3539_cast_fp16)[name = tensor("mh_w_95_cast_fp16")]; tensor var_3542_cast_fp16 = softmax(axis = var_3386, x = mh_w_95_cast_fp16)[name = tensor("op_3542_cast_fp16")]; tensor var_3543 = const()[name = tensor("op_3543"), val = tensor([1, 20, 64, -1])]; tensor var_3544_cast_fp16 = reshape(shape = var_3543, x = value_63_cast_fp16)[name = tensor("op_3544_cast_fp16")]; tensor attn_63_transpose_x_0 = const()[name = tensor("attn_63_transpose_x_0"), val = tensor(false)]; tensor attn_63_transpose_y_0 = const()[name = tensor("attn_63_transpose_y_0"), val = tensor(true)]; tensor attn_63_cast_fp16 = matmul(transpose_x = attn_63_transpose_x_0, transpose_y = attn_63_transpose_y_0, x = var_3544_cast_fp16, y = var_3542_cast_fp16)[name = tensor("attn_63_cast_fp16")]; tensor var_3547 = const()[name = tensor("op_3547"), val = tensor([1, 1280, 1, -1])]; tensor input_153_cast_fp16 = reshape(shape = var_3547, x = attn_63_cast_fp16)[name = tensor("input_153_cast_fp16")]; tensor var_3551 = const()[name = tensor("op_3551"), val = tensor([1, 1])]; tensor var_3553 = const()[name = tensor("op_3553"), val = tensor([1, 1])]; tensor obj_191_pad_type_0 = const()[name = tensor("obj_191_pad_type_0"), val = tensor("custom")]; tensor obj_191_pad_0 = const()[name = tensor("obj_191_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(453572736))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454801600))), name = tensor("layers_15_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_15_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_15_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454801792)))]; tensor obj_191_cast_fp16 = conv(bias = layers_15_encoder_attn_o_proj_bias_to_fp16, dilations = var_3553, groups = var_3393, pad = obj_191_pad_0, pad_type = obj_191_pad_type_0, strides = var_3551, weight = layers_15_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_153_cast_fp16)[name = tensor("obj_191_cast_fp16")]; tensor inputs_95_cast_fp16 = add(x = inputs_93_cast_fp16, y = obj_191_cast_fp16)[name = tensor("inputs_95_cast_fp16")]; tensor var_3559 = const()[name = tensor("op_3559"), val = tensor([1])]; tensor channels_mean_95_cast_fp16 = reduce_mean(axes = var_3559, keep_dims = var_3394, x = inputs_95_cast_fp16)[name = tensor("channels_mean_95_cast_fp16")]; tensor zero_mean_95_cast_fp16 = sub(x = inputs_95_cast_fp16, y = channels_mean_95_cast_fp16)[name = tensor("zero_mean_95_cast_fp16")]; tensor zero_mean_sq_95_cast_fp16 = mul(x = zero_mean_95_cast_fp16, y = zero_mean_95_cast_fp16)[name = tensor("zero_mean_sq_95_cast_fp16")]; tensor var_3563 = const()[name = tensor("op_3563"), val = tensor([1])]; tensor var_3564_cast_fp16 = reduce_mean(axes = var_3563, keep_dims = var_3394, x = zero_mean_sq_95_cast_fp16)[name = tensor("op_3564_cast_fp16")]; tensor var_3565_to_fp16 = const()[name = tensor("op_3565_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3566_cast_fp16 = add(x = var_3564_cast_fp16, y = var_3565_to_fp16)[name = tensor("op_3566_cast_fp16")]; tensor denom_95_epsilon_0 = const()[name = tensor("denom_95_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_95_cast_fp16 = rsqrt(epsilon = denom_95_epsilon_0, x = var_3566_cast_fp16)[name = tensor("denom_95_cast_fp16")]; tensor out_95_cast_fp16 = mul(x = zero_mean_95_cast_fp16, y = denom_95_cast_fp16)[name = tensor("out_95_cast_fp16")]; tensor input_155_gamma_0_to_fp16 = const()[name = tensor("input_155_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454804416)))]; tensor input_155_beta_0_to_fp16 = const()[name = tensor("input_155_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454807040)))]; tensor input_155_epsilon_0_to_fp16 = const()[name = tensor("input_155_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_155_cast_fp16 = batch_norm(beta = input_155_beta_0_to_fp16, epsilon = input_155_epsilon_0_to_fp16, gamma = input_155_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_95_cast_fp16)[name = tensor("input_155_cast_fp16")]; tensor var_3577 = const()[name = tensor("op_3577"), val = tensor([1, 1])]; tensor var_3579 = const()[name = tensor("op_3579"), val = tensor([1, 1])]; tensor input_157_pad_type_0 = const()[name = tensor("input_157_pad_type_0"), val = tensor("custom")]; tensor input_157_pad_0 = const()[name = tensor("input_157_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454809664))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(461363328))), name = tensor("layers_15_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_15_fc1_bias_to_fp16 = const()[name = tensor("layers_15_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(461363904)))]; tensor input_157_cast_fp16 = conv(bias = layers_15_fc1_bias_to_fp16, dilations = var_3579, groups = var_3393, pad = input_157_pad_0, pad_type = input_157_pad_type_0, strides = var_3577, weight = layers_15_fc1_weight_to_fp16_palettized, x = input_155_cast_fp16)[name = tensor("input_157_cast_fp16")]; tensor input_159_mode_0 = const()[name = tensor("input_159_mode_0"), val = tensor("EXACT")]; tensor input_159_cast_fp16 = gelu(mode = input_159_mode_0, x = input_157_cast_fp16)[name = tensor("input_159_cast_fp16")]; tensor var_3585 = const()[name = tensor("op_3585"), val = tensor([1, 1])]; tensor var_3587 = const()[name = tensor("op_3587"), val = tensor([1, 1])]; tensor hidden_states_33_pad_type_0 = const()[name = tensor("hidden_states_33_pad_type_0"), val = tensor("custom")]; tensor hidden_states_33_pad_0 = const()[name = tensor("hidden_states_33_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_15_fc2_weight_to_fp16 = const()[name = tensor("layers_15_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(461374208)))]; tensor layers_15_fc2_bias_to_fp16 = const()[name = tensor("layers_15_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(474481472)))]; tensor hidden_states_33_cast_fp16 = conv(bias = layers_15_fc2_bias_to_fp16, dilations = var_3587, groups = var_3393, pad = hidden_states_33_pad_0, pad_type = hidden_states_33_pad_type_0, strides = var_3585, weight = layers_15_fc2_weight_to_fp16, x = input_159_cast_fp16)[name = tensor("hidden_states_33_cast_fp16")]; tensor inputs_97_cast_fp16 = add(x = inputs_95_cast_fp16, y = hidden_states_33_cast_fp16)[name = tensor("inputs_97_cast_fp16")]; tensor var_3600 = const()[name = tensor("op_3600"), val = tensor(3)]; tensor var_3607 = const()[name = tensor("op_3607"), val = tensor(1)]; tensor var_3608 = const()[name = tensor("op_3608"), val = tensor(true)]; tensor var_3620 = const()[name = tensor("op_3620"), val = tensor([1])]; tensor channels_mean_97_cast_fp16 = reduce_mean(axes = var_3620, keep_dims = var_3608, x = inputs_97_cast_fp16)[name = tensor("channels_mean_97_cast_fp16")]; tensor zero_mean_97_cast_fp16 = sub(x = inputs_97_cast_fp16, y = channels_mean_97_cast_fp16)[name = tensor("zero_mean_97_cast_fp16")]; tensor zero_mean_sq_97_cast_fp16 = mul(x = zero_mean_97_cast_fp16, y = zero_mean_97_cast_fp16)[name = tensor("zero_mean_sq_97_cast_fp16")]; tensor var_3624 = const()[name = tensor("op_3624"), val = tensor([1])]; tensor var_3625_cast_fp16 = reduce_mean(axes = var_3624, keep_dims = var_3608, x = zero_mean_sq_97_cast_fp16)[name = tensor("op_3625_cast_fp16")]; tensor var_3626_to_fp16 = const()[name = tensor("op_3626_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3627_cast_fp16 = add(x = var_3625_cast_fp16, y = var_3626_to_fp16)[name = tensor("op_3627_cast_fp16")]; tensor denom_97_epsilon_0 = const()[name = tensor("denom_97_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_97_cast_fp16 = rsqrt(epsilon = denom_97_epsilon_0, x = var_3627_cast_fp16)[name = tensor("denom_97_cast_fp16")]; tensor out_97_cast_fp16 = mul(x = zero_mean_97_cast_fp16, y = denom_97_cast_fp16)[name = tensor("out_97_cast_fp16")]; tensor obj_193_gamma_0_to_fp16 = const()[name = tensor("obj_193_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(474484096)))]; tensor obj_193_beta_0_to_fp16 = const()[name = tensor("obj_193_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(474486720)))]; tensor obj_193_epsilon_0_to_fp16 = const()[name = tensor("obj_193_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_193_cast_fp16 = batch_norm(beta = obj_193_beta_0_to_fp16, epsilon = obj_193_epsilon_0_to_fp16, gamma = obj_193_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_97_cast_fp16)[name = tensor("obj_193_cast_fp16")]; tensor var_3642 = const()[name = tensor("op_3642"), val = tensor([1, 1])]; tensor var_3644 = const()[name = tensor("op_3644"), val = tensor([1, 1])]; tensor query_65_pad_type_0 = const()[name = tensor("query_65_pad_type_0"), val = tensor("custom")]; tensor query_65_pad_0 = const()[name = tensor("query_65_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(474489344))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(475308608))), name = tensor("layers_16_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_16_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_16_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(475308736)))]; tensor query_65_cast_fp16 = conv(bias = layers_16_self_attn_q_proj_bias_to_fp16, dilations = var_3644, groups = var_3607, pad = query_65_pad_0, pad_type = query_65_pad_type_0, strides = var_3642, weight = layers_16_self_attn_q_proj_weight_to_fp16_palettized, x = obj_193_cast_fp16)[name = tensor("query_65_cast_fp16")]; tensor var_3648 = const()[name = tensor("op_3648"), val = tensor([1, 1])]; tensor var_3650 = const()[name = tensor("op_3650"), val = tensor([1, 1])]; tensor current_key_33_pad_type_0 = const()[name = tensor("current_key_33_pad_type_0"), val = tensor("custom")]; tensor current_key_33_pad_0 = const()[name = tensor("current_key_33_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(475311360))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(476540224))), name = tensor("layers_16_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_33_cast_fp16 = conv(dilations = var_3650, groups = var_3607, pad = current_key_33_pad_0, pad_type = current_key_33_pad_type_0, strides = var_3648, weight = layers_16_self_attn_k_proj_weight_to_fp16_palettized, x = obj_193_cast_fp16)[name = tensor("current_key_33_cast_fp16")]; tensor var_3655 = const()[name = tensor("op_3655"), val = tensor([1, 1])]; tensor var_3657 = const()[name = tensor("op_3657"), val = tensor([1, 1])]; tensor current_value_33_pad_type_0 = const()[name = tensor("current_value_33_pad_type_0"), val = tensor("custom")]; tensor current_value_33_pad_0 = const()[name = tensor("current_value_33_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(476540416))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(477359680))), name = tensor("layers_16_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_16_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_16_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(477359808)))]; tensor current_value_33_cast_fp16 = conv(bias = layers_16_self_attn_v_proj_bias_to_fp16, dilations = var_3657, groups = var_3607, pad = current_value_33_pad_0, pad_type = current_value_33_pad_type_0, strides = var_3655, weight = layers_16_self_attn_v_proj_weight_to_fp16_palettized, x = obj_193_cast_fp16)[name = tensor("current_value_33_cast_fp16")]; tensor var_3664_cast_fp16 = mul(x = current_key_33_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3664_cast_fp16")]; tensor var_3666_cast_fp16 = mul(x = var_103_cast_fp16_16, y = var_241_cast_fp16)[name = tensor("op_3666_cast_fp16")]; tensor key_65_cast_fp16 = add(x = var_3664_cast_fp16, y = var_3666_cast_fp16)[name = tensor("key_65_cast_fp16")]; tensor var_3668_cast_fp16 = mul(x = current_value_33_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3668_cast_fp16")]; tensor var_3670_cast_fp16 = mul(x = var_138_cast_fp16_16, y = var_241_cast_fp16)[name = tensor("op_3670_cast_fp16")]; tensor value_65_cast_fp16 = add(x = var_3668_cast_fp16, y = var_3670_cast_fp16)[name = tensor("value_65_cast_fp16")]; tensor var_3673 = const()[name = tensor("op_3673"), val = tensor([1, 20, 64, -1])]; tensor var_3674_cast_fp16 = reshape(shape = var_3673, x = query_65_cast_fp16)[name = tensor("op_3674_cast_fp16")]; tensor var_3675_to_fp16 = const()[name = tensor("op_3675_to_fp16"), val = tensor(0x1p-3)]; tensor var_3676_cast_fp16 = mul(x = var_3674_cast_fp16, y = var_3675_to_fp16)[name = tensor("op_3676_cast_fp16")]; tensor var_3677 = const()[name = tensor("op_3677"), val = tensor([1, 20, 64, -1])]; tensor var_3678_cast_fp16 = reshape(shape = var_3677, x = key_65_cast_fp16)[name = tensor("op_3678_cast_fp16")]; tensor mh_w_97_transpose_x_0 = const()[name = tensor("mh_w_97_transpose_x_0"), val = tensor(true)]; tensor mh_w_97_transpose_y_0 = const()[name = tensor("mh_w_97_transpose_y_0"), val = tensor(false)]; tensor mh_w_97_cast_fp16 = matmul(transpose_x = mh_w_97_transpose_x_0, transpose_y = mh_w_97_transpose_y_0, x = var_3676_cast_fp16, y = var_3678_cast_fp16)[name = tensor("mh_w_97_cast_fp16")]; tensor mh_w_99_cast_fp16 = add(x = mh_w_97_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_99_cast_fp16")]; tensor var_3686_cast_fp16 = softmax(axis = var_3600, x = mh_w_99_cast_fp16)[name = tensor("op_3686_cast_fp16")]; tensor var_3687 = const()[name = tensor("op_3687"), val = tensor([1, 20, 64, -1])]; tensor var_3688_cast_fp16 = reshape(shape = var_3687, x = value_65_cast_fp16)[name = tensor("op_3688_cast_fp16")]; tensor attn_65_transpose_x_0 = const()[name = tensor("attn_65_transpose_x_0"), val = tensor(false)]; tensor attn_65_transpose_y_0 = const()[name = tensor("attn_65_transpose_y_0"), val = tensor(true)]; tensor attn_65_cast_fp16 = matmul(transpose_x = attn_65_transpose_x_0, transpose_y = attn_65_transpose_y_0, x = var_3688_cast_fp16, y = var_3686_cast_fp16)[name = tensor("attn_65_cast_fp16")]; tensor var_3691 = const()[name = tensor("op_3691"), val = tensor([1, 1280, 1, -1])]; tensor input_161_cast_fp16 = reshape(shape = var_3691, x = attn_65_cast_fp16)[name = tensor("input_161_cast_fp16")]; tensor var_3695 = const()[name = tensor("op_3695"), val = tensor([1, 1])]; tensor var_3697 = const()[name = tensor("op_3697"), val = tensor([1, 1])]; tensor obj_199_pad_type_0 = const()[name = tensor("obj_199_pad_type_0"), val = tensor("custom")]; tensor obj_199_pad_0 = const()[name = tensor("obj_199_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(477362432))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478591296))), name = tensor("layers_16_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_16_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_16_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478591488)))]; tensor obj_199_cast_fp16 = conv(bias = layers_16_self_attn_o_proj_bias_to_fp16, dilations = var_3697, groups = var_3607, pad = obj_199_pad_0, pad_type = obj_199_pad_type_0, strides = var_3695, weight = layers_16_self_attn_o_proj_weight_to_fp16_palettized, x = input_161_cast_fp16)[name = tensor("obj_199_cast_fp16")]; tensor inputs_99_cast_fp16 = add(x = inputs_97_cast_fp16, y = obj_199_cast_fp16)[name = tensor("inputs_99_cast_fp16")]; tensor var_3707 = const()[name = tensor("op_3707"), val = tensor([1])]; tensor channels_mean_99_cast_fp16 = reduce_mean(axes = var_3707, keep_dims = var_3608, x = inputs_99_cast_fp16)[name = tensor("channels_mean_99_cast_fp16")]; tensor zero_mean_99_cast_fp16 = sub(x = inputs_99_cast_fp16, y = channels_mean_99_cast_fp16)[name = tensor("zero_mean_99_cast_fp16")]; tensor zero_mean_sq_99_cast_fp16 = mul(x = zero_mean_99_cast_fp16, y = zero_mean_99_cast_fp16)[name = tensor("zero_mean_sq_99_cast_fp16")]; tensor var_3711 = const()[name = tensor("op_3711"), val = tensor([1])]; tensor var_3712_cast_fp16 = reduce_mean(axes = var_3711, keep_dims = var_3608, x = zero_mean_sq_99_cast_fp16)[name = tensor("op_3712_cast_fp16")]; tensor var_3713_to_fp16 = const()[name = tensor("op_3713_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3714_cast_fp16 = add(x = var_3712_cast_fp16, y = var_3713_to_fp16)[name = tensor("op_3714_cast_fp16")]; tensor denom_99_epsilon_0 = const()[name = tensor("denom_99_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_99_cast_fp16 = rsqrt(epsilon = denom_99_epsilon_0, x = var_3714_cast_fp16)[name = tensor("denom_99_cast_fp16")]; tensor out_99_cast_fp16 = mul(x = zero_mean_99_cast_fp16, y = denom_99_cast_fp16)[name = tensor("out_99_cast_fp16")]; tensor obj_201_gamma_0_to_fp16 = const()[name = tensor("obj_201_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478594112)))]; tensor obj_201_beta_0_to_fp16 = const()[name = tensor("obj_201_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478596736)))]; tensor obj_201_epsilon_0_to_fp16 = const()[name = tensor("obj_201_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_201_cast_fp16 = batch_norm(beta = obj_201_beta_0_to_fp16, epsilon = obj_201_epsilon_0_to_fp16, gamma = obj_201_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_99_cast_fp16)[name = tensor("obj_201_cast_fp16")]; tensor var_3729 = const()[name = tensor("op_3729"), val = tensor([1, 1])]; tensor var_3731 = const()[name = tensor("op_3731"), val = tensor([1, 1])]; tensor query_67_pad_type_0 = const()[name = tensor("query_67_pad_type_0"), val = tensor("custom")]; tensor query_67_pad_0 = const()[name = tensor("query_67_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_encoder_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_16_encoder_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478599360)))]; tensor layers_16_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_16_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(481876224)))]; tensor query_67_cast_fp16 = conv(bias = layers_16_encoder_attn_q_proj_bias_to_fp16, dilations = var_3731, groups = var_3607, pad = query_67_pad_0, pad_type = query_67_pad_type_0, strides = var_3729, weight = layers_16_encoder_attn_q_proj_weight_to_fp16, x = obj_201_cast_fp16)[name = tensor("query_67_cast_fp16")]; tensor var_3735 = const()[name = tensor("op_3735"), val = tensor([1, 1])]; tensor var_3737 = const()[name = tensor("op_3737"), val = tensor([1, 1])]; tensor key_67_pad_type_0 = const()[name = tensor("key_67_pad_type_0"), val = tensor("custom")]; tensor key_67_pad_0 = const()[name = tensor("key_67_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(481878848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(483517312))), name = tensor("layers_16_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_67_cast_fp16 = conv(dilations = var_3737, groups = var_3607, pad = key_67_pad_0, pad_type = key_67_pad_type_0, strides = var_3735, weight = layers_16_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_67_cast_fp16")]; tensor var_3742 = const()[name = tensor("op_3742"), val = tensor([1, 1])]; tensor var_3744 = const()[name = tensor("op_3744"), val = tensor([1, 1])]; tensor value_67_pad_type_0 = const()[name = tensor("value_67_pad_type_0"), val = tensor("custom")]; tensor value_67_pad_0 = const()[name = tensor("value_67_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(483517888))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(484746752))), name = tensor("layers_16_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_16_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_16_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(484746944)))]; tensor value_67_cast_fp16 = conv(bias = layers_16_encoder_attn_v_proj_bias_to_fp16, dilations = var_3744, groups = var_3607, pad = value_67_pad_0, pad_type = value_67_pad_type_0, strides = var_3742, weight = layers_16_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_67_cast_fp16")]; tensor var_3748 = const()[name = tensor("op_3748"), val = tensor([1, 20, 64, -1])]; tensor var_3749_cast_fp16 = reshape(shape = var_3748, x = query_67_cast_fp16)[name = tensor("op_3749_cast_fp16")]; tensor var_3750_to_fp16 = const()[name = tensor("op_3750_to_fp16"), val = tensor(0x1p-3)]; tensor var_3751_cast_fp16 = mul(x = var_3749_cast_fp16, y = var_3750_to_fp16)[name = tensor("op_3751_cast_fp16")]; tensor var_3752 = const()[name = tensor("op_3752"), val = tensor([1, 20, 64, -1])]; tensor var_3753_cast_fp16 = reshape(shape = var_3752, x = key_67_cast_fp16)[name = tensor("op_3753_cast_fp16")]; tensor mh_w_101_transpose_x_0 = const()[name = tensor("mh_w_101_transpose_x_0"), val = tensor(true)]; tensor mh_w_101_transpose_y_0 = const()[name = tensor("mh_w_101_transpose_y_0"), val = tensor(false)]; tensor mh_w_101_cast_fp16 = matmul(transpose_x = mh_w_101_transpose_x_0, transpose_y = mh_w_101_transpose_y_0, x = var_3751_cast_fp16, y = var_3753_cast_fp16)[name = tensor("mh_w_101_cast_fp16")]; tensor var_3756_cast_fp16 = softmax(axis = var_3600, x = mh_w_101_cast_fp16)[name = tensor("op_3756_cast_fp16")]; tensor var_3757 = const()[name = tensor("op_3757"), val = tensor([1, 20, 64, -1])]; tensor var_3758_cast_fp16 = reshape(shape = var_3757, x = value_67_cast_fp16)[name = tensor("op_3758_cast_fp16")]; tensor attn_67_transpose_x_0 = const()[name = tensor("attn_67_transpose_x_0"), val = tensor(false)]; tensor attn_67_transpose_y_0 = const()[name = tensor("attn_67_transpose_y_0"), val = tensor(true)]; tensor attn_67_cast_fp16 = matmul(transpose_x = attn_67_transpose_x_0, transpose_y = attn_67_transpose_y_0, x = var_3758_cast_fp16, y = var_3756_cast_fp16)[name = tensor("attn_67_cast_fp16")]; tensor var_3761 = const()[name = tensor("op_3761"), val = tensor([1, 1280, 1, -1])]; tensor input_163_cast_fp16 = reshape(shape = var_3761, x = attn_67_cast_fp16)[name = tensor("input_163_cast_fp16")]; tensor var_3765 = const()[name = tensor("op_3765"), val = tensor([1, 1])]; tensor var_3767 = const()[name = tensor("op_3767"), val = tensor([1, 1])]; tensor obj_203_pad_type_0 = const()[name = tensor("obj_203_pad_type_0"), val = tensor("custom")]; tensor obj_203_pad_0 = const()[name = tensor("obj_203_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_encoder_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_16_encoder_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(484749568)))]; tensor layers_16_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_16_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488026432)))]; tensor obj_203_cast_fp16 = conv(bias = layers_16_encoder_attn_o_proj_bias_to_fp16, dilations = var_3767, groups = var_3607, pad = obj_203_pad_0, pad_type = obj_203_pad_type_0, strides = var_3765, weight = layers_16_encoder_attn_o_proj_weight_to_fp16, x = input_163_cast_fp16)[name = tensor("obj_203_cast_fp16")]; tensor inputs_101_cast_fp16 = add(x = inputs_99_cast_fp16, y = obj_203_cast_fp16)[name = tensor("inputs_101_cast_fp16")]; tensor var_3773 = const()[name = tensor("op_3773"), val = tensor([1])]; tensor channels_mean_101_cast_fp16 = reduce_mean(axes = var_3773, keep_dims = var_3608, x = inputs_101_cast_fp16)[name = tensor("channels_mean_101_cast_fp16")]; tensor zero_mean_101_cast_fp16 = sub(x = inputs_101_cast_fp16, y = channels_mean_101_cast_fp16)[name = tensor("zero_mean_101_cast_fp16")]; tensor zero_mean_sq_101_cast_fp16 = mul(x = zero_mean_101_cast_fp16, y = zero_mean_101_cast_fp16)[name = tensor("zero_mean_sq_101_cast_fp16")]; tensor var_3777 = const()[name = tensor("op_3777"), val = tensor([1])]; tensor var_3778_cast_fp16 = reduce_mean(axes = var_3777, keep_dims = var_3608, x = zero_mean_sq_101_cast_fp16)[name = tensor("op_3778_cast_fp16")]; tensor var_3779_to_fp16 = const()[name = tensor("op_3779_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3780_cast_fp16 = add(x = var_3778_cast_fp16, y = var_3779_to_fp16)[name = tensor("op_3780_cast_fp16")]; tensor denom_101_epsilon_0 = const()[name = tensor("denom_101_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_101_cast_fp16 = rsqrt(epsilon = denom_101_epsilon_0, x = var_3780_cast_fp16)[name = tensor("denom_101_cast_fp16")]; tensor out_101_cast_fp16 = mul(x = zero_mean_101_cast_fp16, y = denom_101_cast_fp16)[name = tensor("out_101_cast_fp16")]; tensor input_165_gamma_0_to_fp16 = const()[name = tensor("input_165_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488029056)))]; tensor input_165_beta_0_to_fp16 = const()[name = tensor("input_165_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488031680)))]; tensor input_165_epsilon_0_to_fp16 = const()[name = tensor("input_165_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_165_cast_fp16 = batch_norm(beta = input_165_beta_0_to_fp16, epsilon = input_165_epsilon_0_to_fp16, gamma = input_165_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_101_cast_fp16)[name = tensor("input_165_cast_fp16")]; tensor var_3791 = const()[name = tensor("op_3791"), val = tensor([1, 1])]; tensor var_3793 = const()[name = tensor("op_3793"), val = tensor([1, 1])]; tensor input_167_pad_type_0 = const()[name = tensor("input_167_pad_type_0"), val = tensor("custom")]; tensor input_167_pad_0 = const()[name = tensor("input_167_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488034304))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492949568))), name = tensor("layers_16_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_16_fc1_bias_to_fp16 = const()[name = tensor("layers_16_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492949760)))]; tensor input_167_cast_fp16 = conv(bias = layers_16_fc1_bias_to_fp16, dilations = var_3793, groups = var_3607, pad = input_167_pad_0, pad_type = input_167_pad_type_0, strides = var_3791, weight = layers_16_fc1_weight_to_fp16_palettized, x = input_165_cast_fp16)[name = tensor("input_167_cast_fp16")]; tensor input_169_mode_0 = const()[name = tensor("input_169_mode_0"), val = tensor("EXACT")]; tensor input_169_cast_fp16 = gelu(mode = input_169_mode_0, x = input_167_cast_fp16)[name = tensor("input_169_cast_fp16")]; tensor var_3799 = const()[name = tensor("op_3799"), val = tensor([1, 1])]; tensor var_3801 = const()[name = tensor("op_3801"), val = tensor([1, 1])]; tensor hidden_states_35_pad_type_0 = const()[name = tensor("hidden_states_35_pad_type_0"), val = tensor("custom")]; tensor hidden_states_35_pad_0 = const()[name = tensor("hidden_states_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_16_fc2_weight_to_fp16 = const()[name = tensor("layers_16_fc2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492960064)))]; tensor layers_16_fc2_bias_to_fp16 = const()[name = tensor("layers_16_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(506067328)))]; tensor hidden_states_35_cast_fp16 = conv(bias = layers_16_fc2_bias_to_fp16, dilations = var_3801, groups = var_3607, pad = hidden_states_35_pad_0, pad_type = hidden_states_35_pad_type_0, strides = var_3799, weight = layers_16_fc2_weight_to_fp16, x = input_169_cast_fp16)[name = tensor("hidden_states_35_cast_fp16")]; tensor inputs_103_cast_fp16 = add(x = inputs_101_cast_fp16, y = hidden_states_35_cast_fp16)[name = tensor("inputs_103_cast_fp16")]; tensor var_3814 = const()[name = tensor("op_3814"), val = tensor(3)]; tensor var_3821 = const()[name = tensor("op_3821"), val = tensor(1)]; tensor var_3822 = const()[name = tensor("op_3822"), val = tensor(true)]; tensor var_3834 = const()[name = tensor("op_3834"), val = tensor([1])]; tensor channels_mean_103_cast_fp16 = reduce_mean(axes = var_3834, keep_dims = var_3822, x = inputs_103_cast_fp16)[name = tensor("channels_mean_103_cast_fp16")]; tensor zero_mean_103_cast_fp16 = sub(x = inputs_103_cast_fp16, y = channels_mean_103_cast_fp16)[name = tensor("zero_mean_103_cast_fp16")]; tensor zero_mean_sq_103_cast_fp16 = mul(x = zero_mean_103_cast_fp16, y = zero_mean_103_cast_fp16)[name = tensor("zero_mean_sq_103_cast_fp16")]; tensor var_3838 = const()[name = tensor("op_3838"), val = tensor([1])]; tensor var_3839_cast_fp16 = reduce_mean(axes = var_3838, keep_dims = var_3822, x = zero_mean_sq_103_cast_fp16)[name = tensor("op_3839_cast_fp16")]; tensor var_3840_to_fp16 = const()[name = tensor("op_3840_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3841_cast_fp16 = add(x = var_3839_cast_fp16, y = var_3840_to_fp16)[name = tensor("op_3841_cast_fp16")]; tensor denom_103_epsilon_0 = const()[name = tensor("denom_103_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_103_cast_fp16 = rsqrt(epsilon = denom_103_epsilon_0, x = var_3841_cast_fp16)[name = tensor("denom_103_cast_fp16")]; tensor out_103_cast_fp16 = mul(x = zero_mean_103_cast_fp16, y = denom_103_cast_fp16)[name = tensor("out_103_cast_fp16")]; tensor obj_205_gamma_0_to_fp16 = const()[name = tensor("obj_205_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(506069952)))]; tensor obj_205_beta_0_to_fp16 = const()[name = tensor("obj_205_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(506072576)))]; tensor obj_205_epsilon_0_to_fp16 = const()[name = tensor("obj_205_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_205_cast_fp16 = batch_norm(beta = obj_205_beta_0_to_fp16, epsilon = obj_205_epsilon_0_to_fp16, gamma = obj_205_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_103_cast_fp16)[name = tensor("obj_205_cast_fp16")]; tensor var_3856 = const()[name = tensor("op_3856"), val = tensor([1, 1])]; tensor var_3858 = const()[name = tensor("op_3858"), val = tensor([1, 1])]; tensor query_69_pad_type_0 = const()[name = tensor("query_69_pad_type_0"), val = tensor("custom")]; tensor query_69_pad_0 = const()[name = tensor("query_69_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(506075200))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507304064))), name = tensor("layers_17_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_17_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_17_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507304256)))]; tensor query_69_cast_fp16 = conv(bias = layers_17_self_attn_q_proj_bias_to_fp16, dilations = var_3858, groups = var_3821, pad = query_69_pad_0, pad_type = query_69_pad_type_0, strides = var_3856, weight = layers_17_self_attn_q_proj_weight_to_fp16_palettized, x = obj_205_cast_fp16)[name = tensor("query_69_cast_fp16")]; tensor var_3862 = const()[name = tensor("op_3862"), val = tensor([1, 1])]; tensor var_3864 = const()[name = tensor("op_3864"), val = tensor([1, 1])]; tensor current_key_35_pad_type_0 = const()[name = tensor("current_key_35_pad_type_0"), val = tensor("custom")]; tensor current_key_35_pad_0 = const()[name = tensor("current_key_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507306880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(508126144))), name = tensor("layers_17_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_35_cast_fp16 = conv(dilations = var_3864, groups = var_3821, pad = current_key_35_pad_0, pad_type = current_key_35_pad_type_0, strides = var_3862, weight = layers_17_self_attn_k_proj_weight_to_fp16_palettized, x = obj_205_cast_fp16)[name = tensor("current_key_35_cast_fp16")]; tensor var_3869 = const()[name = tensor("op_3869"), val = tensor([1, 1])]; tensor var_3871 = const()[name = tensor("op_3871"), val = tensor([1, 1])]; tensor current_value_35_pad_type_0 = const()[name = tensor("current_value_35_pad_type_0"), val = tensor("custom")]; tensor current_value_35_pad_0 = const()[name = tensor("current_value_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(508126272))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(508945536))), name = tensor("layers_17_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_17_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_17_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(508945664)))]; tensor current_value_35_cast_fp16 = conv(bias = layers_17_self_attn_v_proj_bias_to_fp16, dilations = var_3871, groups = var_3821, pad = current_value_35_pad_0, pad_type = current_value_35_pad_type_0, strides = var_3869, weight = layers_17_self_attn_v_proj_weight_to_fp16_palettized, x = obj_205_cast_fp16)[name = tensor("current_value_35_cast_fp16")]; tensor var_3878_cast_fp16 = mul(x = current_key_35_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3878_cast_fp16")]; tensor var_3880_cast_fp16 = mul(x = var_103_cast_fp16_17, y = var_241_cast_fp16)[name = tensor("op_3880_cast_fp16")]; tensor key_69_cast_fp16 = add(x = var_3878_cast_fp16, y = var_3880_cast_fp16)[name = tensor("key_69_cast_fp16")]; tensor var_3882_cast_fp16 = mul(x = current_value_35_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_3882_cast_fp16")]; tensor var_3884_cast_fp16 = mul(x = var_138_cast_fp16_17, y = var_241_cast_fp16)[name = tensor("op_3884_cast_fp16")]; tensor value_69_cast_fp16 = add(x = var_3882_cast_fp16, y = var_3884_cast_fp16)[name = tensor("value_69_cast_fp16")]; tensor var_3887 = const()[name = tensor("op_3887"), val = tensor([1, 20, 64, -1])]; tensor var_3888_cast_fp16 = reshape(shape = var_3887, x = query_69_cast_fp16)[name = tensor("op_3888_cast_fp16")]; tensor var_3889_to_fp16 = const()[name = tensor("op_3889_to_fp16"), val = tensor(0x1p-3)]; tensor var_3890_cast_fp16 = mul(x = var_3888_cast_fp16, y = var_3889_to_fp16)[name = tensor("op_3890_cast_fp16")]; tensor var_3891 = const()[name = tensor("op_3891"), val = tensor([1, 20, 64, -1])]; tensor var_3892_cast_fp16 = reshape(shape = var_3891, x = key_69_cast_fp16)[name = tensor("op_3892_cast_fp16")]; tensor mh_w_103_transpose_x_0 = const()[name = tensor("mh_w_103_transpose_x_0"), val = tensor(true)]; tensor mh_w_103_transpose_y_0 = const()[name = tensor("mh_w_103_transpose_y_0"), val = tensor(false)]; tensor mh_w_103_cast_fp16 = matmul(transpose_x = mh_w_103_transpose_x_0, transpose_y = mh_w_103_transpose_y_0, x = var_3890_cast_fp16, y = var_3892_cast_fp16)[name = tensor("mh_w_103_cast_fp16")]; tensor mh_w_105_cast_fp16 = add(x = mh_w_103_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_105_cast_fp16")]; tensor var_3900_cast_fp16 = softmax(axis = var_3814, x = mh_w_105_cast_fp16)[name = tensor("op_3900_cast_fp16")]; tensor var_3901 = const()[name = tensor("op_3901"), val = tensor([1, 20, 64, -1])]; tensor var_3902_cast_fp16 = reshape(shape = var_3901, x = value_69_cast_fp16)[name = tensor("op_3902_cast_fp16")]; tensor attn_69_transpose_x_0 = const()[name = tensor("attn_69_transpose_x_0"), val = tensor(false)]; tensor attn_69_transpose_y_0 = const()[name = tensor("attn_69_transpose_y_0"), val = tensor(true)]; tensor attn_69_cast_fp16 = matmul(transpose_x = attn_69_transpose_x_0, transpose_y = attn_69_transpose_y_0, x = var_3902_cast_fp16, y = var_3900_cast_fp16)[name = tensor("attn_69_cast_fp16")]; tensor var_3905 = const()[name = tensor("op_3905"), val = tensor([1, 1280, 1, -1])]; tensor input_171_cast_fp16 = reshape(shape = var_3905, x = attn_69_cast_fp16)[name = tensor("input_171_cast_fp16")]; tensor var_3909 = const()[name = tensor("op_3909"), val = tensor([1, 1])]; tensor var_3911 = const()[name = tensor("op_3911"), val = tensor([1, 1])]; tensor obj_211_pad_type_0 = const()[name = tensor("obj_211_pad_type_0"), val = tensor("custom")]; tensor obj_211_pad_0 = const()[name = tensor("obj_211_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(508948288))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(509767552))), name = tensor("layers_17_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_17_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_17_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(509767680)))]; tensor obj_211_cast_fp16 = conv(bias = layers_17_self_attn_o_proj_bias_to_fp16, dilations = var_3911, groups = var_3821, pad = obj_211_pad_0, pad_type = obj_211_pad_type_0, strides = var_3909, weight = layers_17_self_attn_o_proj_weight_to_fp16_palettized, x = input_171_cast_fp16)[name = tensor("obj_211_cast_fp16")]; tensor inputs_105_cast_fp16 = add(x = inputs_103_cast_fp16, y = obj_211_cast_fp16)[name = tensor("inputs_105_cast_fp16")]; tensor var_3921 = const()[name = tensor("op_3921"), val = tensor([1])]; tensor channels_mean_105_cast_fp16 = reduce_mean(axes = var_3921, keep_dims = var_3822, x = inputs_105_cast_fp16)[name = tensor("channels_mean_105_cast_fp16")]; tensor zero_mean_105_cast_fp16 = sub(x = inputs_105_cast_fp16, y = channels_mean_105_cast_fp16)[name = tensor("zero_mean_105_cast_fp16")]; tensor zero_mean_sq_105_cast_fp16 = mul(x = zero_mean_105_cast_fp16, y = zero_mean_105_cast_fp16)[name = tensor("zero_mean_sq_105_cast_fp16")]; tensor var_3925 = const()[name = tensor("op_3925"), val = tensor([1])]; tensor var_3926_cast_fp16 = reduce_mean(axes = var_3925, keep_dims = var_3822, x = zero_mean_sq_105_cast_fp16)[name = tensor("op_3926_cast_fp16")]; tensor var_3927_to_fp16 = const()[name = tensor("op_3927_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3928_cast_fp16 = add(x = var_3926_cast_fp16, y = var_3927_to_fp16)[name = tensor("op_3928_cast_fp16")]; tensor denom_105_epsilon_0 = const()[name = tensor("denom_105_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_105_cast_fp16 = rsqrt(epsilon = denom_105_epsilon_0, x = var_3928_cast_fp16)[name = tensor("denom_105_cast_fp16")]; tensor out_105_cast_fp16 = mul(x = zero_mean_105_cast_fp16, y = denom_105_cast_fp16)[name = tensor("out_105_cast_fp16")]; tensor obj_213_gamma_0_to_fp16 = const()[name = tensor("obj_213_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(509770304)))]; tensor obj_213_beta_0_to_fp16 = const()[name = tensor("obj_213_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(509772928)))]; tensor obj_213_epsilon_0_to_fp16 = const()[name = tensor("obj_213_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_213_cast_fp16 = batch_norm(beta = obj_213_beta_0_to_fp16, epsilon = obj_213_epsilon_0_to_fp16, gamma = obj_213_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_105_cast_fp16)[name = tensor("obj_213_cast_fp16")]; tensor var_3943 = const()[name = tensor("op_3943"), val = tensor([1, 1])]; tensor var_3945 = const()[name = tensor("op_3945"), val = tensor([1, 1])]; tensor query_71_pad_type_0 = const()[name = tensor("query_71_pad_type_0"), val = tensor("custom")]; tensor query_71_pad_0 = const()[name = tensor("query_71_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(509775552))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(511004416))), name = tensor("layers_17_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_17_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_17_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(511004608)))]; tensor query_71_cast_fp16 = conv(bias = layers_17_encoder_attn_q_proj_bias_to_fp16, dilations = var_3945, groups = var_3821, pad = query_71_pad_0, pad_type = query_71_pad_type_0, strides = var_3943, weight = layers_17_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_213_cast_fp16)[name = tensor("query_71_cast_fp16")]; tensor var_3949 = const()[name = tensor("op_3949"), val = tensor([1, 1])]; tensor var_3951 = const()[name = tensor("op_3951"), val = tensor([1, 1])]; tensor key_71_pad_type_0 = const()[name = tensor("key_71_pad_type_0"), val = tensor("custom")]; tensor key_71_pad_0 = const()[name = tensor("key_71_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(511007232))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(511826496))), name = tensor("layers_17_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_71_cast_fp16 = conv(dilations = var_3951, groups = var_3821, pad = key_71_pad_0, pad_type = key_71_pad_type_0, strides = var_3949, weight = layers_17_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_71_cast_fp16")]; tensor var_3956 = const()[name = tensor("op_3956"), val = tensor([1, 1])]; tensor var_3958 = const()[name = tensor("op_3958"), val = tensor([1, 1])]; tensor value_71_pad_type_0 = const()[name = tensor("value_71_pad_type_0"), val = tensor("custom")]; tensor value_71_pad_0 = const()[name = tensor("value_71_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(511826624))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513465088))), name = tensor("layers_17_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_17_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_17_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513465664)))]; tensor value_71_cast_fp16 = conv(bias = layers_17_encoder_attn_v_proj_bias_to_fp16, dilations = var_3958, groups = var_3821, pad = value_71_pad_0, pad_type = value_71_pad_type_0, strides = var_3956, weight = layers_17_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_71_cast_fp16")]; tensor var_3962 = const()[name = tensor("op_3962"), val = tensor([1, 20, 64, -1])]; tensor var_3963_cast_fp16 = reshape(shape = var_3962, x = query_71_cast_fp16)[name = tensor("op_3963_cast_fp16")]; tensor var_3964_to_fp16 = const()[name = tensor("op_3964_to_fp16"), val = tensor(0x1p-3)]; tensor var_3965_cast_fp16 = mul(x = var_3963_cast_fp16, y = var_3964_to_fp16)[name = tensor("op_3965_cast_fp16")]; tensor var_3966 = const()[name = tensor("op_3966"), val = tensor([1, 20, 64, -1])]; tensor var_3967_cast_fp16 = reshape(shape = var_3966, x = key_71_cast_fp16)[name = tensor("op_3967_cast_fp16")]; tensor mh_w_107_transpose_x_0 = const()[name = tensor("mh_w_107_transpose_x_0"), val = tensor(true)]; tensor mh_w_107_transpose_y_0 = const()[name = tensor("mh_w_107_transpose_y_0"), val = tensor(false)]; tensor mh_w_107_cast_fp16 = matmul(transpose_x = mh_w_107_transpose_x_0, transpose_y = mh_w_107_transpose_y_0, x = var_3965_cast_fp16, y = var_3967_cast_fp16)[name = tensor("mh_w_107_cast_fp16")]; tensor var_3970_cast_fp16 = softmax(axis = var_3814, x = mh_w_107_cast_fp16)[name = tensor("op_3970_cast_fp16")]; tensor var_3971 = const()[name = tensor("op_3971"), val = tensor([1, 20, 64, -1])]; tensor var_3972_cast_fp16 = reshape(shape = var_3971, x = value_71_cast_fp16)[name = tensor("op_3972_cast_fp16")]; tensor attn_71_transpose_x_0 = const()[name = tensor("attn_71_transpose_x_0"), val = tensor(false)]; tensor attn_71_transpose_y_0 = const()[name = tensor("attn_71_transpose_y_0"), val = tensor(true)]; tensor attn_71_cast_fp16 = matmul(transpose_x = attn_71_transpose_x_0, transpose_y = attn_71_transpose_y_0, x = var_3972_cast_fp16, y = var_3970_cast_fp16)[name = tensor("attn_71_cast_fp16")]; tensor var_3975 = const()[name = tensor("op_3975"), val = tensor([1, 1280, 1, -1])]; tensor input_173_cast_fp16 = reshape(shape = var_3975, x = attn_71_cast_fp16)[name = tensor("input_173_cast_fp16")]; tensor var_3979 = const()[name = tensor("op_3979"), val = tensor([1, 1])]; tensor var_3981 = const()[name = tensor("op_3981"), val = tensor([1, 1])]; tensor obj_215_pad_type_0 = const()[name = tensor("obj_215_pad_type_0"), val = tensor("custom")]; tensor obj_215_pad_0 = const()[name = tensor("obj_215_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513468288))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(515106752))), name = tensor("layers_17_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_17_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_17_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(515107328)))]; tensor obj_215_cast_fp16 = conv(bias = layers_17_encoder_attn_o_proj_bias_to_fp16, dilations = var_3981, groups = var_3821, pad = obj_215_pad_0, pad_type = obj_215_pad_type_0, strides = var_3979, weight = layers_17_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_173_cast_fp16)[name = tensor("obj_215_cast_fp16")]; tensor inputs_107_cast_fp16 = add(x = inputs_105_cast_fp16, y = obj_215_cast_fp16)[name = tensor("inputs_107_cast_fp16")]; tensor var_3987 = const()[name = tensor("op_3987"), val = tensor([1])]; tensor channels_mean_107_cast_fp16 = reduce_mean(axes = var_3987, keep_dims = var_3822, x = inputs_107_cast_fp16)[name = tensor("channels_mean_107_cast_fp16")]; tensor zero_mean_107_cast_fp16 = sub(x = inputs_107_cast_fp16, y = channels_mean_107_cast_fp16)[name = tensor("zero_mean_107_cast_fp16")]; tensor zero_mean_sq_107_cast_fp16 = mul(x = zero_mean_107_cast_fp16, y = zero_mean_107_cast_fp16)[name = tensor("zero_mean_sq_107_cast_fp16")]; tensor var_3991 = const()[name = tensor("op_3991"), val = tensor([1])]; tensor var_3992_cast_fp16 = reduce_mean(axes = var_3991, keep_dims = var_3822, x = zero_mean_sq_107_cast_fp16)[name = tensor("op_3992_cast_fp16")]; tensor var_3993_to_fp16 = const()[name = tensor("op_3993_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3994_cast_fp16 = add(x = var_3992_cast_fp16, y = var_3993_to_fp16)[name = tensor("op_3994_cast_fp16")]; tensor denom_107_epsilon_0 = const()[name = tensor("denom_107_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_107_cast_fp16 = rsqrt(epsilon = denom_107_epsilon_0, x = var_3994_cast_fp16)[name = tensor("denom_107_cast_fp16")]; tensor out_107_cast_fp16 = mul(x = zero_mean_107_cast_fp16, y = denom_107_cast_fp16)[name = tensor("out_107_cast_fp16")]; tensor input_175_gamma_0_to_fp16 = const()[name = tensor("input_175_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(515109952)))]; tensor input_175_beta_0_to_fp16 = const()[name = tensor("input_175_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(515112576)))]; tensor input_175_epsilon_0_to_fp16 = const()[name = tensor("input_175_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_175_cast_fp16 = batch_norm(beta = input_175_beta_0_to_fp16, epsilon = input_175_epsilon_0_to_fp16, gamma = input_175_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_107_cast_fp16)[name = tensor("input_175_cast_fp16")]; tensor var_4005 = const()[name = tensor("op_4005"), val = tensor([1, 1])]; tensor var_4007 = const()[name = tensor("op_4007"), val = tensor([1, 1])]; tensor input_177_pad_type_0 = const()[name = tensor("input_177_pad_type_0"), val = tensor("custom")]; tensor input_177_pad_0 = const()[name = tensor("input_177_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(515115200))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(520030464))), name = tensor("layers_17_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_17_fc1_bias_to_fp16 = const()[name = tensor("layers_17_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(520030656)))]; tensor input_177_cast_fp16 = conv(bias = layers_17_fc1_bias_to_fp16, dilations = var_4007, groups = var_3821, pad = input_177_pad_0, pad_type = input_177_pad_type_0, strides = var_4005, weight = layers_17_fc1_weight_to_fp16_palettized, x = input_175_cast_fp16)[name = tensor("input_177_cast_fp16")]; tensor input_179_mode_0 = const()[name = tensor("input_179_mode_0"), val = tensor("EXACT")]; tensor input_179_cast_fp16 = gelu(mode = input_179_mode_0, x = input_177_cast_fp16)[name = tensor("input_179_cast_fp16")]; tensor var_4013 = const()[name = tensor("op_4013"), val = tensor([1, 1])]; tensor var_4015 = const()[name = tensor("op_4015"), val = tensor([1, 1])]; tensor hidden_states_37_pad_type_0 = const()[name = tensor("hidden_states_37_pad_type_0"), val = tensor("custom")]; tensor hidden_states_37_pad_0 = const()[name = tensor("hidden_states_37_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_17_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(520040960))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526594624))), name = tensor("layers_17_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_17_fc2_bias_to_fp16 = const()[name = tensor("layers_17_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526595200)))]; tensor hidden_states_37_cast_fp16 = conv(bias = layers_17_fc2_bias_to_fp16, dilations = var_4015, groups = var_3821, pad = hidden_states_37_pad_0, pad_type = hidden_states_37_pad_type_0, strides = var_4013, weight = layers_17_fc2_weight_to_fp16_palettized, x = input_179_cast_fp16)[name = tensor("hidden_states_37_cast_fp16")]; tensor inputs_109_cast_fp16 = add(x = inputs_107_cast_fp16, y = hidden_states_37_cast_fp16)[name = tensor("inputs_109_cast_fp16")]; tensor var_4028 = const()[name = tensor("op_4028"), val = tensor(3)]; tensor var_4035 = const()[name = tensor("op_4035"), val = tensor(1)]; tensor var_4036 = const()[name = tensor("op_4036"), val = tensor(true)]; tensor var_4048 = const()[name = tensor("op_4048"), val = tensor([1])]; tensor channels_mean_109_cast_fp16 = reduce_mean(axes = var_4048, keep_dims = var_4036, x = inputs_109_cast_fp16)[name = tensor("channels_mean_109_cast_fp16")]; tensor zero_mean_109_cast_fp16 = sub(x = inputs_109_cast_fp16, y = channels_mean_109_cast_fp16)[name = tensor("zero_mean_109_cast_fp16")]; tensor zero_mean_sq_109_cast_fp16 = mul(x = zero_mean_109_cast_fp16, y = zero_mean_109_cast_fp16)[name = tensor("zero_mean_sq_109_cast_fp16")]; tensor var_4052 = const()[name = tensor("op_4052"), val = tensor([1])]; tensor var_4053_cast_fp16 = reduce_mean(axes = var_4052, keep_dims = var_4036, x = zero_mean_sq_109_cast_fp16)[name = tensor("op_4053_cast_fp16")]; tensor var_4054_to_fp16 = const()[name = tensor("op_4054_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4055_cast_fp16 = add(x = var_4053_cast_fp16, y = var_4054_to_fp16)[name = tensor("op_4055_cast_fp16")]; tensor denom_109_epsilon_0 = const()[name = tensor("denom_109_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_109_cast_fp16 = rsqrt(epsilon = denom_109_epsilon_0, x = var_4055_cast_fp16)[name = tensor("denom_109_cast_fp16")]; tensor out_109_cast_fp16 = mul(x = zero_mean_109_cast_fp16, y = denom_109_cast_fp16)[name = tensor("out_109_cast_fp16")]; tensor obj_217_gamma_0_to_fp16 = const()[name = tensor("obj_217_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526597824)))]; tensor obj_217_beta_0_to_fp16 = const()[name = tensor("obj_217_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526600448)))]; tensor obj_217_epsilon_0_to_fp16 = const()[name = tensor("obj_217_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_217_cast_fp16 = batch_norm(beta = obj_217_beta_0_to_fp16, epsilon = obj_217_epsilon_0_to_fp16, gamma = obj_217_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_109_cast_fp16)[name = tensor("obj_217_cast_fp16")]; tensor var_4070 = const()[name = tensor("op_4070"), val = tensor([1, 1])]; tensor var_4072 = const()[name = tensor("op_4072"), val = tensor([1, 1])]; tensor query_73_pad_type_0 = const()[name = tensor("query_73_pad_type_0"), val = tensor("custom")]; tensor query_73_pad_0 = const()[name = tensor("query_73_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526603072))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(527831936))), name = tensor("layers_18_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_18_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_18_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(527832128)))]; tensor query_73_cast_fp16 = conv(bias = layers_18_self_attn_q_proj_bias_to_fp16, dilations = var_4072, groups = var_4035, pad = query_73_pad_0, pad_type = query_73_pad_type_0, strides = var_4070, weight = layers_18_self_attn_q_proj_weight_to_fp16_palettized, x = obj_217_cast_fp16)[name = tensor("query_73_cast_fp16")]; tensor var_4076 = const()[name = tensor("op_4076"), val = tensor([1, 1])]; tensor var_4078 = const()[name = tensor("op_4078"), val = tensor([1, 1])]; tensor current_key_37_pad_type_0 = const()[name = tensor("current_key_37_pad_type_0"), val = tensor("custom")]; tensor current_key_37_pad_0 = const()[name = tensor("current_key_37_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(527834752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528654016))), name = tensor("layers_18_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_37_cast_fp16 = conv(dilations = var_4078, groups = var_4035, pad = current_key_37_pad_0, pad_type = current_key_37_pad_type_0, strides = var_4076, weight = layers_18_self_attn_k_proj_weight_to_fp16_palettized, x = obj_217_cast_fp16)[name = tensor("current_key_37_cast_fp16")]; tensor var_4083 = const()[name = tensor("op_4083"), val = tensor([1, 1])]; tensor var_4085 = const()[name = tensor("op_4085"), val = tensor([1, 1])]; tensor current_value_37_pad_type_0 = const()[name = tensor("current_value_37_pad_type_0"), val = tensor("custom")]; tensor current_value_37_pad_0 = const()[name = tensor("current_value_37_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528654144))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(529473408))), name = tensor("layers_18_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_18_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_18_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(529473536)))]; tensor current_value_37_cast_fp16 = conv(bias = layers_18_self_attn_v_proj_bias_to_fp16, dilations = var_4085, groups = var_4035, pad = current_value_37_pad_0, pad_type = current_value_37_pad_type_0, strides = var_4083, weight = layers_18_self_attn_v_proj_weight_to_fp16_palettized, x = obj_217_cast_fp16)[name = tensor("current_value_37_cast_fp16")]; tensor var_4092_cast_fp16 = mul(x = current_key_37_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4092_cast_fp16")]; tensor var_4094_cast_fp16 = mul(x = var_103_cast_fp16_18, y = var_241_cast_fp16)[name = tensor("op_4094_cast_fp16")]; tensor key_73_cast_fp16 = add(x = var_4092_cast_fp16, y = var_4094_cast_fp16)[name = tensor("key_73_cast_fp16")]; tensor var_4096_cast_fp16 = mul(x = current_value_37_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4096_cast_fp16")]; tensor var_4098_cast_fp16 = mul(x = var_138_cast_fp16_18, y = var_241_cast_fp16)[name = tensor("op_4098_cast_fp16")]; tensor value_73_cast_fp16 = add(x = var_4096_cast_fp16, y = var_4098_cast_fp16)[name = tensor("value_73_cast_fp16")]; tensor var_4101 = const()[name = tensor("op_4101"), val = tensor([1, 20, 64, -1])]; tensor var_4102_cast_fp16 = reshape(shape = var_4101, x = query_73_cast_fp16)[name = tensor("op_4102_cast_fp16")]; tensor var_4103_to_fp16 = const()[name = tensor("op_4103_to_fp16"), val = tensor(0x1p-3)]; tensor var_4104_cast_fp16 = mul(x = var_4102_cast_fp16, y = var_4103_to_fp16)[name = tensor("op_4104_cast_fp16")]; tensor var_4105 = const()[name = tensor("op_4105"), val = tensor([1, 20, 64, -1])]; tensor var_4106_cast_fp16 = reshape(shape = var_4105, x = key_73_cast_fp16)[name = tensor("op_4106_cast_fp16")]; tensor mh_w_109_transpose_x_0 = const()[name = tensor("mh_w_109_transpose_x_0"), val = tensor(true)]; tensor mh_w_109_transpose_y_0 = const()[name = tensor("mh_w_109_transpose_y_0"), val = tensor(false)]; tensor mh_w_109_cast_fp16 = matmul(transpose_x = mh_w_109_transpose_x_0, transpose_y = mh_w_109_transpose_y_0, x = var_4104_cast_fp16, y = var_4106_cast_fp16)[name = tensor("mh_w_109_cast_fp16")]; tensor mh_w_111_cast_fp16 = add(x = mh_w_109_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_111_cast_fp16")]; tensor var_4114_cast_fp16 = softmax(axis = var_4028, x = mh_w_111_cast_fp16)[name = tensor("op_4114_cast_fp16")]; tensor var_4115 = const()[name = tensor("op_4115"), val = tensor([1, 20, 64, -1])]; tensor var_4116_cast_fp16 = reshape(shape = var_4115, x = value_73_cast_fp16)[name = tensor("op_4116_cast_fp16")]; tensor attn_73_transpose_x_0 = const()[name = tensor("attn_73_transpose_x_0"), val = tensor(false)]; tensor attn_73_transpose_y_0 = const()[name = tensor("attn_73_transpose_y_0"), val = tensor(true)]; tensor attn_73_cast_fp16 = matmul(transpose_x = attn_73_transpose_x_0, transpose_y = attn_73_transpose_y_0, x = var_4116_cast_fp16, y = var_4114_cast_fp16)[name = tensor("attn_73_cast_fp16")]; tensor var_4119 = const()[name = tensor("op_4119"), val = tensor([1, 1280, 1, -1])]; tensor input_181_cast_fp16 = reshape(shape = var_4119, x = attn_73_cast_fp16)[name = tensor("input_181_cast_fp16")]; tensor var_4123 = const()[name = tensor("op_4123"), val = tensor([1, 1])]; tensor var_4125 = const()[name = tensor("op_4125"), val = tensor([1, 1])]; tensor obj_223_pad_type_0 = const()[name = tensor("obj_223_pad_type_0"), val = tensor("custom")]; tensor obj_223_pad_0 = const()[name = tensor("obj_223_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(529476160))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(530705024))), name = tensor("layers_18_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_18_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_18_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(530705216)))]; tensor obj_223_cast_fp16 = conv(bias = layers_18_self_attn_o_proj_bias_to_fp16, dilations = var_4125, groups = var_4035, pad = obj_223_pad_0, pad_type = obj_223_pad_type_0, strides = var_4123, weight = layers_18_self_attn_o_proj_weight_to_fp16_palettized, x = input_181_cast_fp16)[name = tensor("obj_223_cast_fp16")]; tensor inputs_111_cast_fp16 = add(x = inputs_109_cast_fp16, y = obj_223_cast_fp16)[name = tensor("inputs_111_cast_fp16")]; tensor var_4135 = const()[name = tensor("op_4135"), val = tensor([1])]; tensor channels_mean_111_cast_fp16 = reduce_mean(axes = var_4135, keep_dims = var_4036, x = inputs_111_cast_fp16)[name = tensor("channels_mean_111_cast_fp16")]; tensor zero_mean_111_cast_fp16 = sub(x = inputs_111_cast_fp16, y = channels_mean_111_cast_fp16)[name = tensor("zero_mean_111_cast_fp16")]; tensor zero_mean_sq_111_cast_fp16 = mul(x = zero_mean_111_cast_fp16, y = zero_mean_111_cast_fp16)[name = tensor("zero_mean_sq_111_cast_fp16")]; tensor var_4139 = const()[name = tensor("op_4139"), val = tensor([1])]; tensor var_4140_cast_fp16 = reduce_mean(axes = var_4139, keep_dims = var_4036, x = zero_mean_sq_111_cast_fp16)[name = tensor("op_4140_cast_fp16")]; tensor var_4141_to_fp16 = const()[name = tensor("op_4141_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4142_cast_fp16 = add(x = var_4140_cast_fp16, y = var_4141_to_fp16)[name = tensor("op_4142_cast_fp16")]; tensor denom_111_epsilon_0 = const()[name = tensor("denom_111_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_111_cast_fp16 = rsqrt(epsilon = denom_111_epsilon_0, x = var_4142_cast_fp16)[name = tensor("denom_111_cast_fp16")]; tensor out_111_cast_fp16 = mul(x = zero_mean_111_cast_fp16, y = denom_111_cast_fp16)[name = tensor("out_111_cast_fp16")]; tensor obj_225_gamma_0_to_fp16 = const()[name = tensor("obj_225_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(530707840)))]; tensor obj_225_beta_0_to_fp16 = const()[name = tensor("obj_225_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(530710464)))]; tensor obj_225_epsilon_0_to_fp16 = const()[name = tensor("obj_225_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_225_cast_fp16 = batch_norm(beta = obj_225_beta_0_to_fp16, epsilon = obj_225_epsilon_0_to_fp16, gamma = obj_225_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_111_cast_fp16)[name = tensor("obj_225_cast_fp16")]; tensor var_4157 = const()[name = tensor("op_4157"), val = tensor([1, 1])]; tensor var_4159 = const()[name = tensor("op_4159"), val = tensor([1, 1])]; tensor query_75_pad_type_0 = const()[name = tensor("query_75_pad_type_0"), val = tensor("custom")]; tensor query_75_pad_0 = const()[name = tensor("query_75_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(530713088))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(531941952))), name = tensor("layers_18_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_18_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_18_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(531942144)))]; tensor query_75_cast_fp16 = conv(bias = layers_18_encoder_attn_q_proj_bias_to_fp16, dilations = var_4159, groups = var_4035, pad = query_75_pad_0, pad_type = query_75_pad_type_0, strides = var_4157, weight = layers_18_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_225_cast_fp16)[name = tensor("query_75_cast_fp16")]; tensor var_4163 = const()[name = tensor("op_4163"), val = tensor([1, 1])]; tensor var_4165 = const()[name = tensor("op_4165"), val = tensor([1, 1])]; tensor key_75_pad_type_0 = const()[name = tensor("key_75_pad_type_0"), val = tensor("custom")]; tensor key_75_pad_0 = const()[name = tensor("key_75_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(531944768))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533173632))), name = tensor("layers_18_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_75_cast_fp16 = conv(dilations = var_4165, groups = var_4035, pad = key_75_pad_0, pad_type = key_75_pad_type_0, strides = var_4163, weight = layers_18_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_75_cast_fp16")]; tensor var_4170 = const()[name = tensor("op_4170"), val = tensor([1, 1])]; tensor var_4172 = const()[name = tensor("op_4172"), val = tensor([1, 1])]; tensor value_75_pad_type_0 = const()[name = tensor("value_75_pad_type_0"), val = tensor("custom")]; tensor value_75_pad_0 = const()[name = tensor("value_75_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(533173824))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(534402688))), name = tensor("layers_18_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_18_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_18_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(534402880)))]; tensor value_75_cast_fp16 = conv(bias = layers_18_encoder_attn_v_proj_bias_to_fp16, dilations = var_4172, groups = var_4035, pad = value_75_pad_0, pad_type = value_75_pad_type_0, strides = var_4170, weight = layers_18_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_75_cast_fp16")]; tensor var_4176 = const()[name = tensor("op_4176"), val = tensor([1, 20, 64, -1])]; tensor var_4177_cast_fp16 = reshape(shape = var_4176, x = query_75_cast_fp16)[name = tensor("op_4177_cast_fp16")]; tensor var_4178_to_fp16 = const()[name = tensor("op_4178_to_fp16"), val = tensor(0x1p-3)]; tensor var_4179_cast_fp16 = mul(x = var_4177_cast_fp16, y = var_4178_to_fp16)[name = tensor("op_4179_cast_fp16")]; tensor var_4180 = const()[name = tensor("op_4180"), val = tensor([1, 20, 64, -1])]; tensor var_4181_cast_fp16 = reshape(shape = var_4180, x = key_75_cast_fp16)[name = tensor("op_4181_cast_fp16")]; tensor mh_w_113_transpose_x_0 = const()[name = tensor("mh_w_113_transpose_x_0"), val = tensor(true)]; tensor mh_w_113_transpose_y_0 = const()[name = tensor("mh_w_113_transpose_y_0"), val = tensor(false)]; tensor mh_w_113_cast_fp16 = matmul(transpose_x = mh_w_113_transpose_x_0, transpose_y = mh_w_113_transpose_y_0, x = var_4179_cast_fp16, y = var_4181_cast_fp16)[name = tensor("mh_w_113_cast_fp16")]; tensor var_4184_cast_fp16 = softmax(axis = var_4028, x = mh_w_113_cast_fp16)[name = tensor("op_4184_cast_fp16")]; tensor var_4185 = const()[name = tensor("op_4185"), val = tensor([1, 20, 64, -1])]; tensor var_4186_cast_fp16 = reshape(shape = var_4185, x = value_75_cast_fp16)[name = tensor("op_4186_cast_fp16")]; tensor attn_75_transpose_x_0 = const()[name = tensor("attn_75_transpose_x_0"), val = tensor(false)]; tensor attn_75_transpose_y_0 = const()[name = tensor("attn_75_transpose_y_0"), val = tensor(true)]; tensor attn_75_cast_fp16 = matmul(transpose_x = attn_75_transpose_x_0, transpose_y = attn_75_transpose_y_0, x = var_4186_cast_fp16, y = var_4184_cast_fp16)[name = tensor("attn_75_cast_fp16")]; tensor var_4189 = const()[name = tensor("op_4189"), val = tensor([1, 1280, 1, -1])]; tensor input_183_cast_fp16 = reshape(shape = var_4189, x = attn_75_cast_fp16)[name = tensor("input_183_cast_fp16")]; tensor var_4193 = const()[name = tensor("op_4193"), val = tensor([1, 1])]; tensor var_4195 = const()[name = tensor("op_4195"), val = tensor([1, 1])]; tensor obj_227_pad_type_0 = const()[name = tensor("obj_227_pad_type_0"), val = tensor("custom")]; tensor obj_227_pad_0 = const()[name = tensor("obj_227_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(534405504))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535634368))), name = tensor("layers_18_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_18_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_18_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535634560)))]; tensor obj_227_cast_fp16 = conv(bias = layers_18_encoder_attn_o_proj_bias_to_fp16, dilations = var_4195, groups = var_4035, pad = obj_227_pad_0, pad_type = obj_227_pad_type_0, strides = var_4193, weight = layers_18_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_183_cast_fp16)[name = tensor("obj_227_cast_fp16")]; tensor inputs_113_cast_fp16 = add(x = inputs_111_cast_fp16, y = obj_227_cast_fp16)[name = tensor("inputs_113_cast_fp16")]; tensor var_4201 = const()[name = tensor("op_4201"), val = tensor([1])]; tensor channels_mean_113_cast_fp16 = reduce_mean(axes = var_4201, keep_dims = var_4036, x = inputs_113_cast_fp16)[name = tensor("channels_mean_113_cast_fp16")]; tensor zero_mean_113_cast_fp16 = sub(x = inputs_113_cast_fp16, y = channels_mean_113_cast_fp16)[name = tensor("zero_mean_113_cast_fp16")]; tensor zero_mean_sq_113_cast_fp16 = mul(x = zero_mean_113_cast_fp16, y = zero_mean_113_cast_fp16)[name = tensor("zero_mean_sq_113_cast_fp16")]; tensor var_4205 = const()[name = tensor("op_4205"), val = tensor([1])]; tensor var_4206_cast_fp16 = reduce_mean(axes = var_4205, keep_dims = var_4036, x = zero_mean_sq_113_cast_fp16)[name = tensor("op_4206_cast_fp16")]; tensor var_4207_to_fp16 = const()[name = tensor("op_4207_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4208_cast_fp16 = add(x = var_4206_cast_fp16, y = var_4207_to_fp16)[name = tensor("op_4208_cast_fp16")]; tensor denom_113_epsilon_0 = const()[name = tensor("denom_113_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_113_cast_fp16 = rsqrt(epsilon = denom_113_epsilon_0, x = var_4208_cast_fp16)[name = tensor("denom_113_cast_fp16")]; tensor out_113_cast_fp16 = mul(x = zero_mean_113_cast_fp16, y = denom_113_cast_fp16)[name = tensor("out_113_cast_fp16")]; tensor input_185_gamma_0_to_fp16 = const()[name = tensor("input_185_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535637184)))]; tensor input_185_beta_0_to_fp16 = const()[name = tensor("input_185_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535639808)))]; tensor input_185_epsilon_0_to_fp16 = const()[name = tensor("input_185_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_185_cast_fp16 = batch_norm(beta = input_185_beta_0_to_fp16, epsilon = input_185_epsilon_0_to_fp16, gamma = input_185_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_113_cast_fp16)[name = tensor("input_185_cast_fp16")]; tensor var_4219 = const()[name = tensor("op_4219"), val = tensor([1, 1])]; tensor var_4221 = const()[name = tensor("op_4221"), val = tensor([1, 1])]; tensor input_187_pad_type_0 = const()[name = tensor("input_187_pad_type_0"), val = tensor("custom")]; tensor input_187_pad_0 = const()[name = tensor("input_187_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(535642432))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540557696))), name = tensor("layers_18_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_18_fc1_bias_to_fp16 = const()[name = tensor("layers_18_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540557888)))]; tensor input_187_cast_fp16 = conv(bias = layers_18_fc1_bias_to_fp16, dilations = var_4221, groups = var_4035, pad = input_187_pad_0, pad_type = input_187_pad_type_0, strides = var_4219, weight = layers_18_fc1_weight_to_fp16_palettized, x = input_185_cast_fp16)[name = tensor("input_187_cast_fp16")]; tensor input_189_mode_0 = const()[name = tensor("input_189_mode_0"), val = tensor("EXACT")]; tensor input_189_cast_fp16 = gelu(mode = input_189_mode_0, x = input_187_cast_fp16)[name = tensor("input_189_cast_fp16")]; tensor var_4227 = const()[name = tensor("op_4227"), val = tensor([1, 1])]; tensor var_4229 = const()[name = tensor("op_4229"), val = tensor([1, 1])]; tensor hidden_states_39_pad_type_0 = const()[name = tensor("hidden_states_39_pad_type_0"), val = tensor("custom")]; tensor hidden_states_39_pad_0 = const()[name = tensor("hidden_states_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_18_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540568192))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545483456))), name = tensor("layers_18_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_18_fc2_bias_to_fp16 = const()[name = tensor("layers_18_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545483648)))]; tensor hidden_states_39_cast_fp16 = conv(bias = layers_18_fc2_bias_to_fp16, dilations = var_4229, groups = var_4035, pad = hidden_states_39_pad_0, pad_type = hidden_states_39_pad_type_0, strides = var_4227, weight = layers_18_fc2_weight_to_fp16_palettized, x = input_189_cast_fp16)[name = tensor("hidden_states_39_cast_fp16")]; tensor inputs_115_cast_fp16 = add(x = inputs_113_cast_fp16, y = hidden_states_39_cast_fp16)[name = tensor("inputs_115_cast_fp16")]; tensor var_4242 = const()[name = tensor("op_4242"), val = tensor(3)]; tensor var_4249 = const()[name = tensor("op_4249"), val = tensor(1)]; tensor var_4250 = const()[name = tensor("op_4250"), val = tensor(true)]; tensor var_4262 = const()[name = tensor("op_4262"), val = tensor([1])]; tensor channels_mean_115_cast_fp16 = reduce_mean(axes = var_4262, keep_dims = var_4250, x = inputs_115_cast_fp16)[name = tensor("channels_mean_115_cast_fp16")]; tensor zero_mean_115_cast_fp16 = sub(x = inputs_115_cast_fp16, y = channels_mean_115_cast_fp16)[name = tensor("zero_mean_115_cast_fp16")]; tensor zero_mean_sq_115_cast_fp16 = mul(x = zero_mean_115_cast_fp16, y = zero_mean_115_cast_fp16)[name = tensor("zero_mean_sq_115_cast_fp16")]; tensor var_4266 = const()[name = tensor("op_4266"), val = tensor([1])]; tensor var_4267_cast_fp16 = reduce_mean(axes = var_4266, keep_dims = var_4250, x = zero_mean_sq_115_cast_fp16)[name = tensor("op_4267_cast_fp16")]; tensor var_4268_to_fp16 = const()[name = tensor("op_4268_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4269_cast_fp16 = add(x = var_4267_cast_fp16, y = var_4268_to_fp16)[name = tensor("op_4269_cast_fp16")]; tensor denom_115_epsilon_0 = const()[name = tensor("denom_115_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_115_cast_fp16 = rsqrt(epsilon = denom_115_epsilon_0, x = var_4269_cast_fp16)[name = tensor("denom_115_cast_fp16")]; tensor out_115_cast_fp16 = mul(x = zero_mean_115_cast_fp16, y = denom_115_cast_fp16)[name = tensor("out_115_cast_fp16")]; tensor obj_229_gamma_0_to_fp16 = const()[name = tensor("obj_229_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545486272)))]; tensor obj_229_beta_0_to_fp16 = const()[name = tensor("obj_229_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545488896)))]; tensor obj_229_epsilon_0_to_fp16 = const()[name = tensor("obj_229_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_229_cast_fp16 = batch_norm(beta = obj_229_beta_0_to_fp16, epsilon = obj_229_epsilon_0_to_fp16, gamma = obj_229_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_115_cast_fp16)[name = tensor("obj_229_cast_fp16")]; tensor var_4284 = const()[name = tensor("op_4284"), val = tensor([1, 1])]; tensor var_4286 = const()[name = tensor("op_4286"), val = tensor([1, 1])]; tensor query_77_pad_type_0 = const()[name = tensor("query_77_pad_type_0"), val = tensor("custom")]; tensor query_77_pad_0 = const()[name = tensor("query_77_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545491520))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(546310784))), name = tensor("layers_19_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_19_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_19_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(546310912)))]; tensor query_77_cast_fp16 = conv(bias = layers_19_self_attn_q_proj_bias_to_fp16, dilations = var_4286, groups = var_4249, pad = query_77_pad_0, pad_type = query_77_pad_type_0, strides = var_4284, weight = layers_19_self_attn_q_proj_weight_to_fp16_palettized, x = obj_229_cast_fp16)[name = tensor("query_77_cast_fp16")]; tensor var_4290 = const()[name = tensor("op_4290"), val = tensor([1, 1])]; tensor var_4292 = const()[name = tensor("op_4292"), val = tensor([1, 1])]; tensor current_key_39_pad_type_0 = const()[name = tensor("current_key_39_pad_type_0"), val = tensor("custom")]; tensor current_key_39_pad_0 = const()[name = tensor("current_key_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(546313536))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547132800))), name = tensor("layers_19_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_39_cast_fp16 = conv(dilations = var_4292, groups = var_4249, pad = current_key_39_pad_0, pad_type = current_key_39_pad_type_0, strides = var_4290, weight = layers_19_self_attn_k_proj_weight_to_fp16_palettized, x = obj_229_cast_fp16)[name = tensor("current_key_39_cast_fp16")]; tensor var_4297 = const()[name = tensor("op_4297"), val = tensor([1, 1])]; tensor var_4299 = const()[name = tensor("op_4299"), val = tensor([1, 1])]; tensor current_value_39_pad_type_0 = const()[name = tensor("current_value_39_pad_type_0"), val = tensor("custom")]; tensor current_value_39_pad_0 = const()[name = tensor("current_value_39_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547132928))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547952192))), name = tensor("layers_19_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_19_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_19_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547952320)))]; tensor current_value_39_cast_fp16 = conv(bias = layers_19_self_attn_v_proj_bias_to_fp16, dilations = var_4299, groups = var_4249, pad = current_value_39_pad_0, pad_type = current_value_39_pad_type_0, strides = var_4297, weight = layers_19_self_attn_v_proj_weight_to_fp16_palettized, x = obj_229_cast_fp16)[name = tensor("current_value_39_cast_fp16")]; tensor var_4306_cast_fp16 = mul(x = current_key_39_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4306_cast_fp16")]; tensor var_4308_cast_fp16 = mul(x = var_103_cast_fp16_19, y = var_241_cast_fp16)[name = tensor("op_4308_cast_fp16")]; tensor key_77_cast_fp16 = add(x = var_4306_cast_fp16, y = var_4308_cast_fp16)[name = tensor("key_77_cast_fp16")]; tensor var_4310_cast_fp16 = mul(x = current_value_39_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4310_cast_fp16")]; tensor var_4312_cast_fp16 = mul(x = var_138_cast_fp16_19, y = var_241_cast_fp16)[name = tensor("op_4312_cast_fp16")]; tensor value_77_cast_fp16 = add(x = var_4310_cast_fp16, y = var_4312_cast_fp16)[name = tensor("value_77_cast_fp16")]; tensor var_4315 = const()[name = tensor("op_4315"), val = tensor([1, 20, 64, -1])]; tensor var_4316_cast_fp16 = reshape(shape = var_4315, x = query_77_cast_fp16)[name = tensor("op_4316_cast_fp16")]; tensor var_4317_to_fp16 = const()[name = tensor("op_4317_to_fp16"), val = tensor(0x1p-3)]; tensor var_4318_cast_fp16 = mul(x = var_4316_cast_fp16, y = var_4317_to_fp16)[name = tensor("op_4318_cast_fp16")]; tensor var_4319 = const()[name = tensor("op_4319"), val = tensor([1, 20, 64, -1])]; tensor var_4320_cast_fp16 = reshape(shape = var_4319, x = key_77_cast_fp16)[name = tensor("op_4320_cast_fp16")]; tensor mh_w_115_transpose_x_0 = const()[name = tensor("mh_w_115_transpose_x_0"), val = tensor(true)]; tensor mh_w_115_transpose_y_0 = const()[name = tensor("mh_w_115_transpose_y_0"), val = tensor(false)]; tensor mh_w_115_cast_fp16 = matmul(transpose_x = mh_w_115_transpose_x_0, transpose_y = mh_w_115_transpose_y_0, x = var_4318_cast_fp16, y = var_4320_cast_fp16)[name = tensor("mh_w_115_cast_fp16")]; tensor mh_w_117_cast_fp16 = add(x = mh_w_115_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_117_cast_fp16")]; tensor var_4328_cast_fp16 = softmax(axis = var_4242, x = mh_w_117_cast_fp16)[name = tensor("op_4328_cast_fp16")]; tensor var_4329 = const()[name = tensor("op_4329"), val = tensor([1, 20, 64, -1])]; tensor var_4330_cast_fp16 = reshape(shape = var_4329, x = value_77_cast_fp16)[name = tensor("op_4330_cast_fp16")]; tensor attn_77_transpose_x_0 = const()[name = tensor("attn_77_transpose_x_0"), val = tensor(false)]; tensor attn_77_transpose_y_0 = const()[name = tensor("attn_77_transpose_y_0"), val = tensor(true)]; tensor attn_77_cast_fp16 = matmul(transpose_x = attn_77_transpose_x_0, transpose_y = attn_77_transpose_y_0, x = var_4330_cast_fp16, y = var_4328_cast_fp16)[name = tensor("attn_77_cast_fp16")]; tensor var_4333 = const()[name = tensor("op_4333"), val = tensor([1, 1280, 1, -1])]; tensor input_191_cast_fp16 = reshape(shape = var_4333, x = attn_77_cast_fp16)[name = tensor("input_191_cast_fp16")]; tensor var_4337 = const()[name = tensor("op_4337"), val = tensor([1, 1])]; tensor var_4339 = const()[name = tensor("op_4339"), val = tensor([1, 1])]; tensor obj_235_pad_type_0 = const()[name = tensor("obj_235_pad_type_0"), val = tensor("custom")]; tensor obj_235_pad_0 = const()[name = tensor("obj_235_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547954944))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(548774208))), name = tensor("layers_19_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_19_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_19_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(548774336)))]; tensor obj_235_cast_fp16 = conv(bias = layers_19_self_attn_o_proj_bias_to_fp16, dilations = var_4339, groups = var_4249, pad = obj_235_pad_0, pad_type = obj_235_pad_type_0, strides = var_4337, weight = layers_19_self_attn_o_proj_weight_to_fp16_palettized, x = input_191_cast_fp16)[name = tensor("obj_235_cast_fp16")]; tensor inputs_117_cast_fp16 = add(x = inputs_115_cast_fp16, y = obj_235_cast_fp16)[name = tensor("inputs_117_cast_fp16")]; tensor var_4349 = const()[name = tensor("op_4349"), val = tensor([1])]; tensor channels_mean_117_cast_fp16 = reduce_mean(axes = var_4349, keep_dims = var_4250, x = inputs_117_cast_fp16)[name = tensor("channels_mean_117_cast_fp16")]; tensor zero_mean_117_cast_fp16 = sub(x = inputs_117_cast_fp16, y = channels_mean_117_cast_fp16)[name = tensor("zero_mean_117_cast_fp16")]; tensor zero_mean_sq_117_cast_fp16 = mul(x = zero_mean_117_cast_fp16, y = zero_mean_117_cast_fp16)[name = tensor("zero_mean_sq_117_cast_fp16")]; tensor var_4353 = const()[name = tensor("op_4353"), val = tensor([1])]; tensor var_4354_cast_fp16 = reduce_mean(axes = var_4353, keep_dims = var_4250, x = zero_mean_sq_117_cast_fp16)[name = tensor("op_4354_cast_fp16")]; tensor var_4355_to_fp16 = const()[name = tensor("op_4355_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4356_cast_fp16 = add(x = var_4354_cast_fp16, y = var_4355_to_fp16)[name = tensor("op_4356_cast_fp16")]; tensor denom_117_epsilon_0 = const()[name = tensor("denom_117_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_117_cast_fp16 = rsqrt(epsilon = denom_117_epsilon_0, x = var_4356_cast_fp16)[name = tensor("denom_117_cast_fp16")]; tensor out_117_cast_fp16 = mul(x = zero_mean_117_cast_fp16, y = denom_117_cast_fp16)[name = tensor("out_117_cast_fp16")]; tensor obj_237_gamma_0_to_fp16 = const()[name = tensor("obj_237_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(548776960)))]; tensor obj_237_beta_0_to_fp16 = const()[name = tensor("obj_237_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(548779584)))]; tensor obj_237_epsilon_0_to_fp16 = const()[name = tensor("obj_237_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_237_cast_fp16 = batch_norm(beta = obj_237_beta_0_to_fp16, epsilon = obj_237_epsilon_0_to_fp16, gamma = obj_237_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_117_cast_fp16)[name = tensor("obj_237_cast_fp16")]; tensor var_4371 = const()[name = tensor("op_4371"), val = tensor([1, 1])]; tensor var_4373 = const()[name = tensor("op_4373"), val = tensor([1, 1])]; tensor query_79_pad_type_0 = const()[name = tensor("query_79_pad_type_0"), val = tensor("custom")]; tensor query_79_pad_0 = const()[name = tensor("query_79_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_encoder_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_19_encoder_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(548782208)))]; tensor layers_19_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_19_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552059072)))]; tensor query_79_cast_fp16 = conv(bias = layers_19_encoder_attn_q_proj_bias_to_fp16, dilations = var_4373, groups = var_4249, pad = query_79_pad_0, pad_type = query_79_pad_type_0, strides = var_4371, weight = layers_19_encoder_attn_q_proj_weight_to_fp16, x = obj_237_cast_fp16)[name = tensor("query_79_cast_fp16")]; tensor var_4377 = const()[name = tensor("op_4377"), val = tensor([1, 1])]; tensor var_4379 = const()[name = tensor("op_4379"), val = tensor([1, 1])]; tensor key_79_pad_type_0 = const()[name = tensor("key_79_pad_type_0"), val = tensor("custom")]; tensor key_79_pad_0 = const()[name = tensor("key_79_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(552061696))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(553290560))), name = tensor("layers_19_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_79_cast_fp16 = conv(dilations = var_4379, groups = var_4249, pad = key_79_pad_0, pad_type = key_79_pad_type_0, strides = var_4377, weight = layers_19_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_79_cast_fp16")]; tensor var_4384 = const()[name = tensor("op_4384"), val = tensor([1, 1])]; tensor var_4386 = const()[name = tensor("op_4386"), val = tensor([1, 1])]; tensor value_79_pad_type_0 = const()[name = tensor("value_79_pad_type_0"), val = tensor("custom")]; tensor value_79_pad_0 = const()[name = tensor("value_79_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(553290752))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(554519616))), name = tensor("layers_19_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_19_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_19_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(554519808)))]; tensor value_79_cast_fp16 = conv(bias = layers_19_encoder_attn_v_proj_bias_to_fp16, dilations = var_4386, groups = var_4249, pad = value_79_pad_0, pad_type = value_79_pad_type_0, strides = var_4384, weight = layers_19_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_79_cast_fp16")]; tensor var_4390 = const()[name = tensor("op_4390"), val = tensor([1, 20, 64, -1])]; tensor var_4391_cast_fp16 = reshape(shape = var_4390, x = query_79_cast_fp16)[name = tensor("op_4391_cast_fp16")]; tensor var_4392_to_fp16 = const()[name = tensor("op_4392_to_fp16"), val = tensor(0x1p-3)]; tensor var_4393_cast_fp16 = mul(x = var_4391_cast_fp16, y = var_4392_to_fp16)[name = tensor("op_4393_cast_fp16")]; tensor var_4394 = const()[name = tensor("op_4394"), val = tensor([1, 20, 64, -1])]; tensor var_4395_cast_fp16 = reshape(shape = var_4394, x = key_79_cast_fp16)[name = tensor("op_4395_cast_fp16")]; tensor mh_w_119_transpose_x_0 = const()[name = tensor("mh_w_119_transpose_x_0"), val = tensor(true)]; tensor mh_w_119_transpose_y_0 = const()[name = tensor("mh_w_119_transpose_y_0"), val = tensor(false)]; tensor mh_w_119_cast_fp16 = matmul(transpose_x = mh_w_119_transpose_x_0, transpose_y = mh_w_119_transpose_y_0, x = var_4393_cast_fp16, y = var_4395_cast_fp16)[name = tensor("mh_w_119_cast_fp16")]; tensor var_4398_cast_fp16 = softmax(axis = var_4242, x = mh_w_119_cast_fp16)[name = tensor("op_4398_cast_fp16")]; tensor var_4399 = const()[name = tensor("op_4399"), val = tensor([1, 20, 64, -1])]; tensor var_4400_cast_fp16 = reshape(shape = var_4399, x = value_79_cast_fp16)[name = tensor("op_4400_cast_fp16")]; tensor attn_79_transpose_x_0 = const()[name = tensor("attn_79_transpose_x_0"), val = tensor(false)]; tensor attn_79_transpose_y_0 = const()[name = tensor("attn_79_transpose_y_0"), val = tensor(true)]; tensor attn_79_cast_fp16 = matmul(transpose_x = attn_79_transpose_x_0, transpose_y = attn_79_transpose_y_0, x = var_4400_cast_fp16, y = var_4398_cast_fp16)[name = tensor("attn_79_cast_fp16")]; tensor var_4403 = const()[name = tensor("op_4403"), val = tensor([1, 1280, 1, -1])]; tensor input_193_cast_fp16 = reshape(shape = var_4403, x = attn_79_cast_fp16)[name = tensor("input_193_cast_fp16")]; tensor var_4407 = const()[name = tensor("op_4407"), val = tensor([1, 1])]; tensor var_4409 = const()[name = tensor("op_4409"), val = tensor([1, 1])]; tensor obj_239_pad_type_0 = const()[name = tensor("obj_239_pad_type_0"), val = tensor("custom")]; tensor obj_239_pad_0 = const()[name = tensor("obj_239_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(554522432))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(556160896))), name = tensor("layers_19_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_19_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_19_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(556161472)))]; tensor obj_239_cast_fp16 = conv(bias = layers_19_encoder_attn_o_proj_bias_to_fp16, dilations = var_4409, groups = var_4249, pad = obj_239_pad_0, pad_type = obj_239_pad_type_0, strides = var_4407, weight = layers_19_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_193_cast_fp16)[name = tensor("obj_239_cast_fp16")]; tensor inputs_119_cast_fp16 = add(x = inputs_117_cast_fp16, y = obj_239_cast_fp16)[name = tensor("inputs_119_cast_fp16")]; tensor var_4415 = const()[name = tensor("op_4415"), val = tensor([1])]; tensor channels_mean_119_cast_fp16 = reduce_mean(axes = var_4415, keep_dims = var_4250, x = inputs_119_cast_fp16)[name = tensor("channels_mean_119_cast_fp16")]; tensor zero_mean_119_cast_fp16 = sub(x = inputs_119_cast_fp16, y = channels_mean_119_cast_fp16)[name = tensor("zero_mean_119_cast_fp16")]; tensor zero_mean_sq_119_cast_fp16 = mul(x = zero_mean_119_cast_fp16, y = zero_mean_119_cast_fp16)[name = tensor("zero_mean_sq_119_cast_fp16")]; tensor var_4419 = const()[name = tensor("op_4419"), val = tensor([1])]; tensor var_4420_cast_fp16 = reduce_mean(axes = var_4419, keep_dims = var_4250, x = zero_mean_sq_119_cast_fp16)[name = tensor("op_4420_cast_fp16")]; tensor var_4421_to_fp16 = const()[name = tensor("op_4421_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4422_cast_fp16 = add(x = var_4420_cast_fp16, y = var_4421_to_fp16)[name = tensor("op_4422_cast_fp16")]; tensor denom_119_epsilon_0 = const()[name = tensor("denom_119_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_119_cast_fp16 = rsqrt(epsilon = denom_119_epsilon_0, x = var_4422_cast_fp16)[name = tensor("denom_119_cast_fp16")]; tensor out_119_cast_fp16 = mul(x = zero_mean_119_cast_fp16, y = denom_119_cast_fp16)[name = tensor("out_119_cast_fp16")]; tensor input_195_gamma_0_to_fp16 = const()[name = tensor("input_195_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(556164096)))]; tensor input_195_beta_0_to_fp16 = const()[name = tensor("input_195_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(556166720)))]; tensor input_195_epsilon_0_to_fp16 = const()[name = tensor("input_195_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_195_cast_fp16 = batch_norm(beta = input_195_beta_0_to_fp16, epsilon = input_195_epsilon_0_to_fp16, gamma = input_195_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_119_cast_fp16)[name = tensor("input_195_cast_fp16")]; tensor var_4433 = const()[name = tensor("op_4433"), val = tensor([1, 1])]; tensor var_4435 = const()[name = tensor("op_4435"), val = tensor([1, 1])]; tensor input_197_pad_type_0 = const()[name = tensor("input_197_pad_type_0"), val = tensor("custom")]; tensor input_197_pad_0 = const()[name = tensor("input_197_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_fc1_weight_to_fp16 = const()[name = tensor("layers_19_fc1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(556169344)))]; tensor layers_19_fc1_bias_to_fp16 = const()[name = tensor("layers_19_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(569276608)))]; tensor input_197_cast_fp16 = conv(bias = layers_19_fc1_bias_to_fp16, dilations = var_4435, groups = var_4249, pad = input_197_pad_0, pad_type = input_197_pad_type_0, strides = var_4433, weight = layers_19_fc1_weight_to_fp16, x = input_195_cast_fp16)[name = tensor("input_197_cast_fp16")]; tensor input_199_mode_0 = const()[name = tensor("input_199_mode_0"), val = tensor("EXACT")]; tensor input_199_cast_fp16 = gelu(mode = input_199_mode_0, x = input_197_cast_fp16)[name = tensor("input_199_cast_fp16")]; tensor var_4441 = const()[name = tensor("op_4441"), val = tensor([1, 1])]; tensor var_4443 = const()[name = tensor("op_4443"), val = tensor([1, 1])]; tensor hidden_states_41_pad_type_0 = const()[name = tensor("hidden_states_41_pad_type_0"), val = tensor("custom")]; tensor hidden_states_41_pad_0 = const()[name = tensor("hidden_states_41_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_19_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(569286912))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575840576))), name = tensor("layers_19_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_19_fc2_bias_to_fp16 = const()[name = tensor("layers_19_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575841152)))]; tensor hidden_states_41_cast_fp16 = conv(bias = layers_19_fc2_bias_to_fp16, dilations = var_4443, groups = var_4249, pad = hidden_states_41_pad_0, pad_type = hidden_states_41_pad_type_0, strides = var_4441, weight = layers_19_fc2_weight_to_fp16_palettized, x = input_199_cast_fp16)[name = tensor("hidden_states_41_cast_fp16")]; tensor inputs_121_cast_fp16 = add(x = inputs_119_cast_fp16, y = hidden_states_41_cast_fp16)[name = tensor("inputs_121_cast_fp16")]; tensor var_4456 = const()[name = tensor("op_4456"), val = tensor(3)]; tensor var_4463 = const()[name = tensor("op_4463"), val = tensor(1)]; tensor var_4464 = const()[name = tensor("op_4464"), val = tensor(true)]; tensor var_4476 = const()[name = tensor("op_4476"), val = tensor([1])]; tensor channels_mean_121_cast_fp16 = reduce_mean(axes = var_4476, keep_dims = var_4464, x = inputs_121_cast_fp16)[name = tensor("channels_mean_121_cast_fp16")]; tensor zero_mean_121_cast_fp16 = sub(x = inputs_121_cast_fp16, y = channels_mean_121_cast_fp16)[name = tensor("zero_mean_121_cast_fp16")]; tensor zero_mean_sq_121_cast_fp16 = mul(x = zero_mean_121_cast_fp16, y = zero_mean_121_cast_fp16)[name = tensor("zero_mean_sq_121_cast_fp16")]; tensor var_4480 = const()[name = tensor("op_4480"), val = tensor([1])]; tensor var_4481_cast_fp16 = reduce_mean(axes = var_4480, keep_dims = var_4464, x = zero_mean_sq_121_cast_fp16)[name = tensor("op_4481_cast_fp16")]; tensor var_4482_to_fp16 = const()[name = tensor("op_4482_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4483_cast_fp16 = add(x = var_4481_cast_fp16, y = var_4482_to_fp16)[name = tensor("op_4483_cast_fp16")]; tensor denom_121_epsilon_0 = const()[name = tensor("denom_121_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_121_cast_fp16 = rsqrt(epsilon = denom_121_epsilon_0, x = var_4483_cast_fp16)[name = tensor("denom_121_cast_fp16")]; tensor out_121_cast_fp16 = mul(x = zero_mean_121_cast_fp16, y = denom_121_cast_fp16)[name = tensor("out_121_cast_fp16")]; tensor obj_241_gamma_0_to_fp16 = const()[name = tensor("obj_241_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575843776)))]; tensor obj_241_beta_0_to_fp16 = const()[name = tensor("obj_241_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575846400)))]; tensor obj_241_epsilon_0_to_fp16 = const()[name = tensor("obj_241_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_241_cast_fp16 = batch_norm(beta = obj_241_beta_0_to_fp16, epsilon = obj_241_epsilon_0_to_fp16, gamma = obj_241_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_121_cast_fp16)[name = tensor("obj_241_cast_fp16")]; tensor var_4498 = const()[name = tensor("op_4498"), val = tensor([1, 1])]; tensor var_4500 = const()[name = tensor("op_4500"), val = tensor([1, 1])]; tensor query_81_pad_type_0 = const()[name = tensor("query_81_pad_type_0"), val = tensor("custom")]; tensor query_81_pad_0 = const()[name = tensor("query_81_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(575849024))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(577077888))), name = tensor("layers_20_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_20_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_20_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(577078080)))]; tensor query_81_cast_fp16 = conv(bias = layers_20_self_attn_q_proj_bias_to_fp16, dilations = var_4500, groups = var_4463, pad = query_81_pad_0, pad_type = query_81_pad_type_0, strides = var_4498, weight = layers_20_self_attn_q_proj_weight_to_fp16_palettized, x = obj_241_cast_fp16)[name = tensor("query_81_cast_fp16")]; tensor var_4504 = const()[name = tensor("op_4504"), val = tensor([1, 1])]; tensor var_4506 = const()[name = tensor("op_4506"), val = tensor([1, 1])]; tensor current_key_41_pad_type_0 = const()[name = tensor("current_key_41_pad_type_0"), val = tensor("custom")]; tensor current_key_41_pad_0 = const()[name = tensor("current_key_41_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(577080704))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(577899968))), name = tensor("layers_20_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_41_cast_fp16 = conv(dilations = var_4506, groups = var_4463, pad = current_key_41_pad_0, pad_type = current_key_41_pad_type_0, strides = var_4504, weight = layers_20_self_attn_k_proj_weight_to_fp16_palettized, x = obj_241_cast_fp16)[name = tensor("current_key_41_cast_fp16")]; tensor var_4511 = const()[name = tensor("op_4511"), val = tensor([1, 1])]; tensor var_4513 = const()[name = tensor("op_4513"), val = tensor([1, 1])]; tensor current_value_41_pad_type_0 = const()[name = tensor("current_value_41_pad_type_0"), val = tensor("custom")]; tensor current_value_41_pad_0 = const()[name = tensor("current_value_41_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(577900096))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578719360))), name = tensor("layers_20_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_20_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_20_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578719488)))]; tensor current_value_41_cast_fp16 = conv(bias = layers_20_self_attn_v_proj_bias_to_fp16, dilations = var_4513, groups = var_4463, pad = current_value_41_pad_0, pad_type = current_value_41_pad_type_0, strides = var_4511, weight = layers_20_self_attn_v_proj_weight_to_fp16_palettized, x = obj_241_cast_fp16)[name = tensor("current_value_41_cast_fp16")]; tensor var_4520_cast_fp16 = mul(x = current_key_41_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4520_cast_fp16")]; tensor var_4522_cast_fp16 = mul(x = var_103_cast_fp16_20, y = var_241_cast_fp16)[name = tensor("op_4522_cast_fp16")]; tensor key_81_cast_fp16 = add(x = var_4520_cast_fp16, y = var_4522_cast_fp16)[name = tensor("key_81_cast_fp16")]; tensor var_4524_cast_fp16 = mul(x = current_value_41_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4524_cast_fp16")]; tensor var_4526_cast_fp16 = mul(x = var_138_cast_fp16_20, y = var_241_cast_fp16)[name = tensor("op_4526_cast_fp16")]; tensor value_81_cast_fp16 = add(x = var_4524_cast_fp16, y = var_4526_cast_fp16)[name = tensor("value_81_cast_fp16")]; tensor var_4529 = const()[name = tensor("op_4529"), val = tensor([1, 20, 64, -1])]; tensor var_4530_cast_fp16 = reshape(shape = var_4529, x = query_81_cast_fp16)[name = tensor("op_4530_cast_fp16")]; tensor var_4531_to_fp16 = const()[name = tensor("op_4531_to_fp16"), val = tensor(0x1p-3)]; tensor var_4532_cast_fp16 = mul(x = var_4530_cast_fp16, y = var_4531_to_fp16)[name = tensor("op_4532_cast_fp16")]; tensor var_4533 = const()[name = tensor("op_4533"), val = tensor([1, 20, 64, -1])]; tensor var_4534_cast_fp16 = reshape(shape = var_4533, x = key_81_cast_fp16)[name = tensor("op_4534_cast_fp16")]; tensor mh_w_121_transpose_x_0 = const()[name = tensor("mh_w_121_transpose_x_0"), val = tensor(true)]; tensor mh_w_121_transpose_y_0 = const()[name = tensor("mh_w_121_transpose_y_0"), val = tensor(false)]; tensor mh_w_121_cast_fp16 = matmul(transpose_x = mh_w_121_transpose_x_0, transpose_y = mh_w_121_transpose_y_0, x = var_4532_cast_fp16, y = var_4534_cast_fp16)[name = tensor("mh_w_121_cast_fp16")]; tensor mh_w_123_cast_fp16 = add(x = mh_w_121_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_123_cast_fp16")]; tensor var_4542_cast_fp16 = softmax(axis = var_4456, x = mh_w_123_cast_fp16)[name = tensor("op_4542_cast_fp16")]; tensor var_4543 = const()[name = tensor("op_4543"), val = tensor([1, 20, 64, -1])]; tensor var_4544_cast_fp16 = reshape(shape = var_4543, x = value_81_cast_fp16)[name = tensor("op_4544_cast_fp16")]; tensor attn_81_transpose_x_0 = const()[name = tensor("attn_81_transpose_x_0"), val = tensor(false)]; tensor attn_81_transpose_y_0 = const()[name = tensor("attn_81_transpose_y_0"), val = tensor(true)]; tensor attn_81_cast_fp16 = matmul(transpose_x = attn_81_transpose_x_0, transpose_y = attn_81_transpose_y_0, x = var_4544_cast_fp16, y = var_4542_cast_fp16)[name = tensor("attn_81_cast_fp16")]; tensor var_4547 = const()[name = tensor("op_4547"), val = tensor([1, 1280, 1, -1])]; tensor input_201_cast_fp16 = reshape(shape = var_4547, x = attn_81_cast_fp16)[name = tensor("input_201_cast_fp16")]; tensor var_4551 = const()[name = tensor("op_4551"), val = tensor([1, 1])]; tensor var_4553 = const()[name = tensor("op_4553"), val = tensor([1, 1])]; tensor obj_247_pad_type_0 = const()[name = tensor("obj_247_pad_type_0"), val = tensor("custom")]; tensor obj_247_pad_0 = const()[name = tensor("obj_247_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(578722112))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(579950976))), name = tensor("layers_20_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_20_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_20_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(579951168)))]; tensor obj_247_cast_fp16 = conv(bias = layers_20_self_attn_o_proj_bias_to_fp16, dilations = var_4553, groups = var_4463, pad = obj_247_pad_0, pad_type = obj_247_pad_type_0, strides = var_4551, weight = layers_20_self_attn_o_proj_weight_to_fp16_palettized, x = input_201_cast_fp16)[name = tensor("obj_247_cast_fp16")]; tensor inputs_123_cast_fp16 = add(x = inputs_121_cast_fp16, y = obj_247_cast_fp16)[name = tensor("inputs_123_cast_fp16")]; tensor var_4563 = const()[name = tensor("op_4563"), val = tensor([1])]; tensor channels_mean_123_cast_fp16 = reduce_mean(axes = var_4563, keep_dims = var_4464, x = inputs_123_cast_fp16)[name = tensor("channels_mean_123_cast_fp16")]; tensor zero_mean_123_cast_fp16 = sub(x = inputs_123_cast_fp16, y = channels_mean_123_cast_fp16)[name = tensor("zero_mean_123_cast_fp16")]; tensor zero_mean_sq_123_cast_fp16 = mul(x = zero_mean_123_cast_fp16, y = zero_mean_123_cast_fp16)[name = tensor("zero_mean_sq_123_cast_fp16")]; tensor var_4567 = const()[name = tensor("op_4567"), val = tensor([1])]; tensor var_4568_cast_fp16 = reduce_mean(axes = var_4567, keep_dims = var_4464, x = zero_mean_sq_123_cast_fp16)[name = tensor("op_4568_cast_fp16")]; tensor var_4569_to_fp16 = const()[name = tensor("op_4569_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4570_cast_fp16 = add(x = var_4568_cast_fp16, y = var_4569_to_fp16)[name = tensor("op_4570_cast_fp16")]; tensor denom_123_epsilon_0 = const()[name = tensor("denom_123_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_123_cast_fp16 = rsqrt(epsilon = denom_123_epsilon_0, x = var_4570_cast_fp16)[name = tensor("denom_123_cast_fp16")]; tensor out_123_cast_fp16 = mul(x = zero_mean_123_cast_fp16, y = denom_123_cast_fp16)[name = tensor("out_123_cast_fp16")]; tensor obj_249_gamma_0_to_fp16 = const()[name = tensor("obj_249_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(579953792)))]; tensor obj_249_beta_0_to_fp16 = const()[name = tensor("obj_249_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(579956416)))]; tensor obj_249_epsilon_0_to_fp16 = const()[name = tensor("obj_249_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_249_cast_fp16 = batch_norm(beta = obj_249_beta_0_to_fp16, epsilon = obj_249_epsilon_0_to_fp16, gamma = obj_249_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_123_cast_fp16)[name = tensor("obj_249_cast_fp16")]; tensor var_4585 = const()[name = tensor("op_4585"), val = tensor([1, 1])]; tensor var_4587 = const()[name = tensor("op_4587"), val = tensor([1, 1])]; tensor query_83_pad_type_0 = const()[name = tensor("query_83_pad_type_0"), val = tensor("custom")]; tensor query_83_pad_0 = const()[name = tensor("query_83_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(579959040))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(581597504))), name = tensor("layers_20_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_20_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_20_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(581598080)))]; tensor query_83_cast_fp16 = conv(bias = layers_20_encoder_attn_q_proj_bias_to_fp16, dilations = var_4587, groups = var_4463, pad = query_83_pad_0, pad_type = query_83_pad_type_0, strides = var_4585, weight = layers_20_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_249_cast_fp16)[name = tensor("query_83_cast_fp16")]; tensor var_4591 = const()[name = tensor("op_4591"), val = tensor([1, 1])]; tensor var_4593 = const()[name = tensor("op_4593"), val = tensor([1, 1])]; tensor key_83_pad_type_0 = const()[name = tensor("key_83_pad_type_0"), val = tensor("custom")]; tensor key_83_pad_0 = const()[name = tensor("key_83_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_encoder_attn_k_proj_weight_to_fp16 = const()[name = tensor("layers_20_encoder_attn_k_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(581600704)))]; tensor key_83_cast_fp16 = conv(dilations = var_4593, groups = var_4463, pad = key_83_pad_0, pad_type = key_83_pad_type_0, strides = var_4591, weight = layers_20_encoder_attn_k_proj_weight_to_fp16, x = encoder_output_embeds)[name = tensor("key_83_cast_fp16")]; tensor var_4598 = const()[name = tensor("op_4598"), val = tensor([1, 1])]; tensor var_4600 = const()[name = tensor("op_4600"), val = tensor([1, 1])]; tensor value_83_pad_type_0 = const()[name = tensor("value_83_pad_type_0"), val = tensor("custom")]; tensor value_83_pad_0 = const()[name = tensor("value_83_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(584877568))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586106432))), name = tensor("layers_20_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_20_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_20_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586106624)))]; tensor value_83_cast_fp16 = conv(bias = layers_20_encoder_attn_v_proj_bias_to_fp16, dilations = var_4600, groups = var_4463, pad = value_83_pad_0, pad_type = value_83_pad_type_0, strides = var_4598, weight = layers_20_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_83_cast_fp16")]; tensor var_4604 = const()[name = tensor("op_4604"), val = tensor([1, 20, 64, -1])]; tensor var_4605_cast_fp16 = reshape(shape = var_4604, x = query_83_cast_fp16)[name = tensor("op_4605_cast_fp16")]; tensor var_4606_to_fp16 = const()[name = tensor("op_4606_to_fp16"), val = tensor(0x1p-3)]; tensor var_4607_cast_fp16 = mul(x = var_4605_cast_fp16, y = var_4606_to_fp16)[name = tensor("op_4607_cast_fp16")]; tensor var_4608 = const()[name = tensor("op_4608"), val = tensor([1, 20, 64, -1])]; tensor var_4609_cast_fp16 = reshape(shape = var_4608, x = key_83_cast_fp16)[name = tensor("op_4609_cast_fp16")]; tensor mh_w_125_transpose_x_0 = const()[name = tensor("mh_w_125_transpose_x_0"), val = tensor(true)]; tensor mh_w_125_transpose_y_0 = const()[name = tensor("mh_w_125_transpose_y_0"), val = tensor(false)]; tensor mh_w_125_cast_fp16 = matmul(transpose_x = mh_w_125_transpose_x_0, transpose_y = mh_w_125_transpose_y_0, x = var_4607_cast_fp16, y = var_4609_cast_fp16)[name = tensor("mh_w_125_cast_fp16")]; tensor var_4612_cast_fp16 = softmax(axis = var_4456, x = mh_w_125_cast_fp16)[name = tensor("op_4612_cast_fp16")]; tensor var_4613 = const()[name = tensor("op_4613"), val = tensor([1, 20, 64, -1])]; tensor var_4614_cast_fp16 = reshape(shape = var_4613, x = value_83_cast_fp16)[name = tensor("op_4614_cast_fp16")]; tensor attn_83_transpose_x_0 = const()[name = tensor("attn_83_transpose_x_0"), val = tensor(false)]; tensor attn_83_transpose_y_0 = const()[name = tensor("attn_83_transpose_y_0"), val = tensor(true)]; tensor attn_83_cast_fp16 = matmul(transpose_x = attn_83_transpose_x_0, transpose_y = attn_83_transpose_y_0, x = var_4614_cast_fp16, y = var_4612_cast_fp16)[name = tensor("attn_83_cast_fp16")]; tensor var_4617 = const()[name = tensor("op_4617"), val = tensor([1, 1280, 1, -1])]; tensor input_203_cast_fp16 = reshape(shape = var_4617, x = attn_83_cast_fp16)[name = tensor("input_203_cast_fp16")]; tensor var_4621 = const()[name = tensor("op_4621"), val = tensor([1, 1])]; tensor var_4623 = const()[name = tensor("op_4623"), val = tensor([1, 1])]; tensor obj_251_pad_type_0 = const()[name = tensor("obj_251_pad_type_0"), val = tensor("custom")]; tensor obj_251_pad_0 = const()[name = tensor("obj_251_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_encoder_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_20_encoder_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586109248)))]; tensor layers_20_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_20_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589386112)))]; tensor obj_251_cast_fp16 = conv(bias = layers_20_encoder_attn_o_proj_bias_to_fp16, dilations = var_4623, groups = var_4463, pad = obj_251_pad_0, pad_type = obj_251_pad_type_0, strides = var_4621, weight = layers_20_encoder_attn_o_proj_weight_to_fp16, x = input_203_cast_fp16)[name = tensor("obj_251_cast_fp16")]; tensor inputs_125_cast_fp16 = add(x = inputs_123_cast_fp16, y = obj_251_cast_fp16)[name = tensor("inputs_125_cast_fp16")]; tensor var_4629 = const()[name = tensor("op_4629"), val = tensor([1])]; tensor channels_mean_125_cast_fp16 = reduce_mean(axes = var_4629, keep_dims = var_4464, x = inputs_125_cast_fp16)[name = tensor("channels_mean_125_cast_fp16")]; tensor zero_mean_125_cast_fp16 = sub(x = inputs_125_cast_fp16, y = channels_mean_125_cast_fp16)[name = tensor("zero_mean_125_cast_fp16")]; tensor zero_mean_sq_125_cast_fp16 = mul(x = zero_mean_125_cast_fp16, y = zero_mean_125_cast_fp16)[name = tensor("zero_mean_sq_125_cast_fp16")]; tensor var_4633 = const()[name = tensor("op_4633"), val = tensor([1])]; tensor var_4634_cast_fp16 = reduce_mean(axes = var_4633, keep_dims = var_4464, x = zero_mean_sq_125_cast_fp16)[name = tensor("op_4634_cast_fp16")]; tensor var_4635_to_fp16 = const()[name = tensor("op_4635_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4636_cast_fp16 = add(x = var_4634_cast_fp16, y = var_4635_to_fp16)[name = tensor("op_4636_cast_fp16")]; tensor denom_125_epsilon_0 = const()[name = tensor("denom_125_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_125_cast_fp16 = rsqrt(epsilon = denom_125_epsilon_0, x = var_4636_cast_fp16)[name = tensor("denom_125_cast_fp16")]; tensor out_125_cast_fp16 = mul(x = zero_mean_125_cast_fp16, y = denom_125_cast_fp16)[name = tensor("out_125_cast_fp16")]; tensor input_205_gamma_0_to_fp16 = const()[name = tensor("input_205_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589388736)))]; tensor input_205_beta_0_to_fp16 = const()[name = tensor("input_205_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589391360)))]; tensor input_205_epsilon_0_to_fp16 = const()[name = tensor("input_205_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_205_cast_fp16 = batch_norm(beta = input_205_beta_0_to_fp16, epsilon = input_205_epsilon_0_to_fp16, gamma = input_205_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_125_cast_fp16)[name = tensor("input_205_cast_fp16")]; tensor var_4647 = const()[name = tensor("op_4647"), val = tensor([1, 1])]; tensor var_4649 = const()[name = tensor("op_4649"), val = tensor([1, 1])]; tensor input_207_pad_type_0 = const()[name = tensor("input_207_pad_type_0"), val = tensor("custom")]; tensor input_207_pad_0 = const()[name = tensor("input_207_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589393984))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(594309248))), name = tensor("layers_20_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_20_fc1_bias_to_fp16 = const()[name = tensor("layers_20_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(594309440)))]; tensor input_207_cast_fp16 = conv(bias = layers_20_fc1_bias_to_fp16, dilations = var_4649, groups = var_4463, pad = input_207_pad_0, pad_type = input_207_pad_type_0, strides = var_4647, weight = layers_20_fc1_weight_to_fp16_palettized, x = input_205_cast_fp16)[name = tensor("input_207_cast_fp16")]; tensor input_209_mode_0 = const()[name = tensor("input_209_mode_0"), val = tensor("EXACT")]; tensor input_209_cast_fp16 = gelu(mode = input_209_mode_0, x = input_207_cast_fp16)[name = tensor("input_209_cast_fp16")]; tensor var_4655 = const()[name = tensor("op_4655"), val = tensor([1, 1])]; tensor var_4657 = const()[name = tensor("op_4657"), val = tensor([1, 1])]; tensor hidden_states_43_pad_type_0 = const()[name = tensor("hidden_states_43_pad_type_0"), val = tensor("custom")]; tensor hidden_states_43_pad_0 = const()[name = tensor("hidden_states_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_20_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(594319744))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(600873408))), name = tensor("layers_20_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_20_fc2_bias_to_fp16 = const()[name = tensor("layers_20_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(600873984)))]; tensor hidden_states_43_cast_fp16 = conv(bias = layers_20_fc2_bias_to_fp16, dilations = var_4657, groups = var_4463, pad = hidden_states_43_pad_0, pad_type = hidden_states_43_pad_type_0, strides = var_4655, weight = layers_20_fc2_weight_to_fp16_palettized, x = input_209_cast_fp16)[name = tensor("hidden_states_43_cast_fp16")]; tensor inputs_127_cast_fp16 = add(x = inputs_125_cast_fp16, y = hidden_states_43_cast_fp16)[name = tensor("inputs_127_cast_fp16")]; tensor var_4670 = const()[name = tensor("op_4670"), val = tensor(3)]; tensor var_4677 = const()[name = tensor("op_4677"), val = tensor(1)]; tensor var_4678 = const()[name = tensor("op_4678"), val = tensor(true)]; tensor var_4690 = const()[name = tensor("op_4690"), val = tensor([1])]; tensor channels_mean_127_cast_fp16 = reduce_mean(axes = var_4690, keep_dims = var_4678, x = inputs_127_cast_fp16)[name = tensor("channels_mean_127_cast_fp16")]; tensor zero_mean_127_cast_fp16 = sub(x = inputs_127_cast_fp16, y = channels_mean_127_cast_fp16)[name = tensor("zero_mean_127_cast_fp16")]; tensor zero_mean_sq_127_cast_fp16 = mul(x = zero_mean_127_cast_fp16, y = zero_mean_127_cast_fp16)[name = tensor("zero_mean_sq_127_cast_fp16")]; tensor var_4694 = const()[name = tensor("op_4694"), val = tensor([1])]; tensor var_4695_cast_fp16 = reduce_mean(axes = var_4694, keep_dims = var_4678, x = zero_mean_sq_127_cast_fp16)[name = tensor("op_4695_cast_fp16")]; tensor var_4696_to_fp16 = const()[name = tensor("op_4696_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4697_cast_fp16 = add(x = var_4695_cast_fp16, y = var_4696_to_fp16)[name = tensor("op_4697_cast_fp16")]; tensor denom_127_epsilon_0 = const()[name = tensor("denom_127_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_127_cast_fp16 = rsqrt(epsilon = denom_127_epsilon_0, x = var_4697_cast_fp16)[name = tensor("denom_127_cast_fp16")]; tensor out_127_cast_fp16 = mul(x = zero_mean_127_cast_fp16, y = denom_127_cast_fp16)[name = tensor("out_127_cast_fp16")]; tensor obj_253_gamma_0_to_fp16 = const()[name = tensor("obj_253_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(600876608)))]; tensor obj_253_beta_0_to_fp16 = const()[name = tensor("obj_253_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(600879232)))]; tensor obj_253_epsilon_0_to_fp16 = const()[name = tensor("obj_253_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_253_cast_fp16 = batch_norm(beta = obj_253_beta_0_to_fp16, epsilon = obj_253_epsilon_0_to_fp16, gamma = obj_253_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_127_cast_fp16)[name = tensor("obj_253_cast_fp16")]; tensor var_4712 = const()[name = tensor("op_4712"), val = tensor([1, 1])]; tensor var_4714 = const()[name = tensor("op_4714"), val = tensor([1, 1])]; tensor query_85_pad_type_0 = const()[name = tensor("query_85_pad_type_0"), val = tensor("custom")]; tensor query_85_pad_0 = const()[name = tensor("query_85_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(600881856))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(601701120))), name = tensor("layers_21_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_21_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_21_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(601701248)))]; tensor query_85_cast_fp16 = conv(bias = layers_21_self_attn_q_proj_bias_to_fp16, dilations = var_4714, groups = var_4677, pad = query_85_pad_0, pad_type = query_85_pad_type_0, strides = var_4712, weight = layers_21_self_attn_q_proj_weight_to_fp16_palettized, x = obj_253_cast_fp16)[name = tensor("query_85_cast_fp16")]; tensor var_4718 = const()[name = tensor("op_4718"), val = tensor([1, 1])]; tensor var_4720 = const()[name = tensor("op_4720"), val = tensor([1, 1])]; tensor current_key_43_pad_type_0 = const()[name = tensor("current_key_43_pad_type_0"), val = tensor("custom")]; tensor current_key_43_pad_0 = const()[name = tensor("current_key_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(601703872))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(602523136))), name = tensor("layers_21_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_43_cast_fp16 = conv(dilations = var_4720, groups = var_4677, pad = current_key_43_pad_0, pad_type = current_key_43_pad_type_0, strides = var_4718, weight = layers_21_self_attn_k_proj_weight_to_fp16_palettized, x = obj_253_cast_fp16)[name = tensor("current_key_43_cast_fp16")]; tensor var_4725 = const()[name = tensor("op_4725"), val = tensor([1, 1])]; tensor var_4727 = const()[name = tensor("op_4727"), val = tensor([1, 1])]; tensor current_value_43_pad_type_0 = const()[name = tensor("current_value_43_pad_type_0"), val = tensor("custom")]; tensor current_value_43_pad_0 = const()[name = tensor("current_value_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(602523264))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(603342528))), name = tensor("layers_21_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_21_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_21_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(603342656)))]; tensor current_value_43_cast_fp16 = conv(bias = layers_21_self_attn_v_proj_bias_to_fp16, dilations = var_4727, groups = var_4677, pad = current_value_43_pad_0, pad_type = current_value_43_pad_type_0, strides = var_4725, weight = layers_21_self_attn_v_proj_weight_to_fp16_palettized, x = obj_253_cast_fp16)[name = tensor("current_value_43_cast_fp16")]; tensor var_4734_cast_fp16 = mul(x = current_key_43_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4734_cast_fp16")]; tensor var_4736_cast_fp16 = mul(x = var_103_cast_fp16_21, y = var_241_cast_fp16)[name = tensor("op_4736_cast_fp16")]; tensor key_85_cast_fp16 = add(x = var_4734_cast_fp16, y = var_4736_cast_fp16)[name = tensor("key_85_cast_fp16")]; tensor var_4738_cast_fp16 = mul(x = current_value_43_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4738_cast_fp16")]; tensor var_4740_cast_fp16 = mul(x = var_138_cast_fp16_21, y = var_241_cast_fp16)[name = tensor("op_4740_cast_fp16")]; tensor value_85_cast_fp16 = add(x = var_4738_cast_fp16, y = var_4740_cast_fp16)[name = tensor("value_85_cast_fp16")]; tensor var_4743 = const()[name = tensor("op_4743"), val = tensor([1, 20, 64, -1])]; tensor var_4744_cast_fp16 = reshape(shape = var_4743, x = query_85_cast_fp16)[name = tensor("op_4744_cast_fp16")]; tensor var_4745_to_fp16 = const()[name = tensor("op_4745_to_fp16"), val = tensor(0x1p-3)]; tensor var_4746_cast_fp16 = mul(x = var_4744_cast_fp16, y = var_4745_to_fp16)[name = tensor("op_4746_cast_fp16")]; tensor var_4747 = const()[name = tensor("op_4747"), val = tensor([1, 20, 64, -1])]; tensor var_4748_cast_fp16 = reshape(shape = var_4747, x = key_85_cast_fp16)[name = tensor("op_4748_cast_fp16")]; tensor mh_w_127_transpose_x_0 = const()[name = tensor("mh_w_127_transpose_x_0"), val = tensor(true)]; tensor mh_w_127_transpose_y_0 = const()[name = tensor("mh_w_127_transpose_y_0"), val = tensor(false)]; tensor mh_w_127_cast_fp16 = matmul(transpose_x = mh_w_127_transpose_x_0, transpose_y = mh_w_127_transpose_y_0, x = var_4746_cast_fp16, y = var_4748_cast_fp16)[name = tensor("mh_w_127_cast_fp16")]; tensor mh_w_129_cast_fp16 = add(x = mh_w_127_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_129_cast_fp16")]; tensor var_4756_cast_fp16 = softmax(axis = var_4670, x = mh_w_129_cast_fp16)[name = tensor("op_4756_cast_fp16")]; tensor var_4757 = const()[name = tensor("op_4757"), val = tensor([1, 20, 64, -1])]; tensor var_4758_cast_fp16 = reshape(shape = var_4757, x = value_85_cast_fp16)[name = tensor("op_4758_cast_fp16")]; tensor attn_85_transpose_x_0 = const()[name = tensor("attn_85_transpose_x_0"), val = tensor(false)]; tensor attn_85_transpose_y_0 = const()[name = tensor("attn_85_transpose_y_0"), val = tensor(true)]; tensor attn_85_cast_fp16 = matmul(transpose_x = attn_85_transpose_x_0, transpose_y = attn_85_transpose_y_0, x = var_4758_cast_fp16, y = var_4756_cast_fp16)[name = tensor("attn_85_cast_fp16")]; tensor var_4761 = const()[name = tensor("op_4761"), val = tensor([1, 1280, 1, -1])]; tensor input_211_cast_fp16 = reshape(shape = var_4761, x = attn_85_cast_fp16)[name = tensor("input_211_cast_fp16")]; tensor var_4765 = const()[name = tensor("op_4765"), val = tensor([1, 1])]; tensor var_4767 = const()[name = tensor("op_4767"), val = tensor([1, 1])]; tensor obj_259_pad_type_0 = const()[name = tensor("obj_259_pad_type_0"), val = tensor("custom")]; tensor obj_259_pad_0 = const()[name = tensor("obj_259_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(603345280))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604574144))), name = tensor("layers_21_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_21_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_21_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604574336)))]; tensor obj_259_cast_fp16 = conv(bias = layers_21_self_attn_o_proj_bias_to_fp16, dilations = var_4767, groups = var_4677, pad = obj_259_pad_0, pad_type = obj_259_pad_type_0, strides = var_4765, weight = layers_21_self_attn_o_proj_weight_to_fp16_palettized, x = input_211_cast_fp16)[name = tensor("obj_259_cast_fp16")]; tensor inputs_129_cast_fp16 = add(x = inputs_127_cast_fp16, y = obj_259_cast_fp16)[name = tensor("inputs_129_cast_fp16")]; tensor var_4777 = const()[name = tensor("op_4777"), val = tensor([1])]; tensor channels_mean_129_cast_fp16 = reduce_mean(axes = var_4777, keep_dims = var_4678, x = inputs_129_cast_fp16)[name = tensor("channels_mean_129_cast_fp16")]; tensor zero_mean_129_cast_fp16 = sub(x = inputs_129_cast_fp16, y = channels_mean_129_cast_fp16)[name = tensor("zero_mean_129_cast_fp16")]; tensor zero_mean_sq_129_cast_fp16 = mul(x = zero_mean_129_cast_fp16, y = zero_mean_129_cast_fp16)[name = tensor("zero_mean_sq_129_cast_fp16")]; tensor var_4781 = const()[name = tensor("op_4781"), val = tensor([1])]; tensor var_4782_cast_fp16 = reduce_mean(axes = var_4781, keep_dims = var_4678, x = zero_mean_sq_129_cast_fp16)[name = tensor("op_4782_cast_fp16")]; tensor var_4783_to_fp16 = const()[name = tensor("op_4783_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4784_cast_fp16 = add(x = var_4782_cast_fp16, y = var_4783_to_fp16)[name = tensor("op_4784_cast_fp16")]; tensor denom_129_epsilon_0 = const()[name = tensor("denom_129_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_129_cast_fp16 = rsqrt(epsilon = denom_129_epsilon_0, x = var_4784_cast_fp16)[name = tensor("denom_129_cast_fp16")]; tensor out_129_cast_fp16 = mul(x = zero_mean_129_cast_fp16, y = denom_129_cast_fp16)[name = tensor("out_129_cast_fp16")]; tensor obj_261_gamma_0_to_fp16 = const()[name = tensor("obj_261_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604576960)))]; tensor obj_261_beta_0_to_fp16 = const()[name = tensor("obj_261_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604579584)))]; tensor obj_261_epsilon_0_to_fp16 = const()[name = tensor("obj_261_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_261_cast_fp16 = batch_norm(beta = obj_261_beta_0_to_fp16, epsilon = obj_261_epsilon_0_to_fp16, gamma = obj_261_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_129_cast_fp16)[name = tensor("obj_261_cast_fp16")]; tensor var_4799 = const()[name = tensor("op_4799"), val = tensor([1, 1])]; tensor var_4801 = const()[name = tensor("op_4801"), val = tensor([1, 1])]; tensor query_87_pad_type_0 = const()[name = tensor("query_87_pad_type_0"), val = tensor("custom")]; tensor query_87_pad_0 = const()[name = tensor("query_87_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(604582208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(605401472))), name = tensor("layers_21_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_21_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_21_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(605401600)))]; tensor query_87_cast_fp16 = conv(bias = layers_21_encoder_attn_q_proj_bias_to_fp16, dilations = var_4801, groups = var_4677, pad = query_87_pad_0, pad_type = query_87_pad_type_0, strides = var_4799, weight = layers_21_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_261_cast_fp16)[name = tensor("query_87_cast_fp16")]; tensor var_4805 = const()[name = tensor("op_4805"), val = tensor([1, 1])]; tensor var_4807 = const()[name = tensor("op_4807"), val = tensor([1, 1])]; tensor key_87_pad_type_0 = const()[name = tensor("key_87_pad_type_0"), val = tensor("custom")]; tensor key_87_pad_0 = const()[name = tensor("key_87_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(605404224))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(606633088))), name = tensor("layers_21_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_87_cast_fp16 = conv(dilations = var_4807, groups = var_4677, pad = key_87_pad_0, pad_type = key_87_pad_type_0, strides = var_4805, weight = layers_21_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_87_cast_fp16")]; tensor var_4812 = const()[name = tensor("op_4812"), val = tensor([1, 1])]; tensor var_4814 = const()[name = tensor("op_4814"), val = tensor([1, 1])]; tensor value_87_pad_type_0 = const()[name = tensor("value_87_pad_type_0"), val = tensor("custom")]; tensor value_87_pad_0 = const()[name = tensor("value_87_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(606633280))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(607452544))), name = tensor("layers_21_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_21_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_21_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(607452672)))]; tensor value_87_cast_fp16 = conv(bias = layers_21_encoder_attn_v_proj_bias_to_fp16, dilations = var_4814, groups = var_4677, pad = value_87_pad_0, pad_type = value_87_pad_type_0, strides = var_4812, weight = layers_21_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_87_cast_fp16")]; tensor var_4818 = const()[name = tensor("op_4818"), val = tensor([1, 20, 64, -1])]; tensor var_4819_cast_fp16 = reshape(shape = var_4818, x = query_87_cast_fp16)[name = tensor("op_4819_cast_fp16")]; tensor var_4820_to_fp16 = const()[name = tensor("op_4820_to_fp16"), val = tensor(0x1p-3)]; tensor var_4821_cast_fp16 = mul(x = var_4819_cast_fp16, y = var_4820_to_fp16)[name = tensor("op_4821_cast_fp16")]; tensor var_4822 = const()[name = tensor("op_4822"), val = tensor([1, 20, 64, -1])]; tensor var_4823_cast_fp16 = reshape(shape = var_4822, x = key_87_cast_fp16)[name = tensor("op_4823_cast_fp16")]; tensor mh_w_131_transpose_x_0 = const()[name = tensor("mh_w_131_transpose_x_0"), val = tensor(true)]; tensor mh_w_131_transpose_y_0 = const()[name = tensor("mh_w_131_transpose_y_0"), val = tensor(false)]; tensor mh_w_131_cast_fp16 = matmul(transpose_x = mh_w_131_transpose_x_0, transpose_y = mh_w_131_transpose_y_0, x = var_4821_cast_fp16, y = var_4823_cast_fp16)[name = tensor("mh_w_131_cast_fp16")]; tensor var_4826_cast_fp16 = softmax(axis = var_4670, x = mh_w_131_cast_fp16)[name = tensor("op_4826_cast_fp16")]; tensor var_4827 = const()[name = tensor("op_4827"), val = tensor([1, 20, 64, -1])]; tensor var_4828_cast_fp16 = reshape(shape = var_4827, x = value_87_cast_fp16)[name = tensor("op_4828_cast_fp16")]; tensor attn_87_transpose_x_0 = const()[name = tensor("attn_87_transpose_x_0"), val = tensor(false)]; tensor attn_87_transpose_y_0 = const()[name = tensor("attn_87_transpose_y_0"), val = tensor(true)]; tensor attn_87_cast_fp16 = matmul(transpose_x = attn_87_transpose_x_0, transpose_y = attn_87_transpose_y_0, x = var_4828_cast_fp16, y = var_4826_cast_fp16)[name = tensor("attn_87_cast_fp16")]; tensor var_4831 = const()[name = tensor("op_4831"), val = tensor([1, 1280, 1, -1])]; tensor input_213_cast_fp16 = reshape(shape = var_4831, x = attn_87_cast_fp16)[name = tensor("input_213_cast_fp16")]; tensor var_4835 = const()[name = tensor("op_4835"), val = tensor([1, 1])]; tensor var_4837 = const()[name = tensor("op_4837"), val = tensor([1, 1])]; tensor obj_263_pad_type_0 = const()[name = tensor("obj_263_pad_type_0"), val = tensor("custom")]; tensor obj_263_pad_0 = const()[name = tensor("obj_263_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(607455296))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(609093760))), name = tensor("layers_21_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_21_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_21_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(609094336)))]; tensor obj_263_cast_fp16 = conv(bias = layers_21_encoder_attn_o_proj_bias_to_fp16, dilations = var_4837, groups = var_4677, pad = obj_263_pad_0, pad_type = obj_263_pad_type_0, strides = var_4835, weight = layers_21_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_213_cast_fp16)[name = tensor("obj_263_cast_fp16")]; tensor inputs_131_cast_fp16 = add(x = inputs_129_cast_fp16, y = obj_263_cast_fp16)[name = tensor("inputs_131_cast_fp16")]; tensor var_4843 = const()[name = tensor("op_4843"), val = tensor([1])]; tensor channels_mean_131_cast_fp16 = reduce_mean(axes = var_4843, keep_dims = var_4678, x = inputs_131_cast_fp16)[name = tensor("channels_mean_131_cast_fp16")]; tensor zero_mean_131_cast_fp16 = sub(x = inputs_131_cast_fp16, y = channels_mean_131_cast_fp16)[name = tensor("zero_mean_131_cast_fp16")]; tensor zero_mean_sq_131_cast_fp16 = mul(x = zero_mean_131_cast_fp16, y = zero_mean_131_cast_fp16)[name = tensor("zero_mean_sq_131_cast_fp16")]; tensor var_4847 = const()[name = tensor("op_4847"), val = tensor([1])]; tensor var_4848_cast_fp16 = reduce_mean(axes = var_4847, keep_dims = var_4678, x = zero_mean_sq_131_cast_fp16)[name = tensor("op_4848_cast_fp16")]; tensor var_4849_to_fp16 = const()[name = tensor("op_4849_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4850_cast_fp16 = add(x = var_4848_cast_fp16, y = var_4849_to_fp16)[name = tensor("op_4850_cast_fp16")]; tensor denom_131_epsilon_0 = const()[name = tensor("denom_131_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_131_cast_fp16 = rsqrt(epsilon = denom_131_epsilon_0, x = var_4850_cast_fp16)[name = tensor("denom_131_cast_fp16")]; tensor out_131_cast_fp16 = mul(x = zero_mean_131_cast_fp16, y = denom_131_cast_fp16)[name = tensor("out_131_cast_fp16")]; tensor input_215_gamma_0_to_fp16 = const()[name = tensor("input_215_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(609096960)))]; tensor input_215_beta_0_to_fp16 = const()[name = tensor("input_215_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(609099584)))]; tensor input_215_epsilon_0_to_fp16 = const()[name = tensor("input_215_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_215_cast_fp16 = batch_norm(beta = input_215_beta_0_to_fp16, epsilon = input_215_epsilon_0_to_fp16, gamma = input_215_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_131_cast_fp16)[name = tensor("input_215_cast_fp16")]; tensor var_4861 = const()[name = tensor("op_4861"), val = tensor([1, 1])]; tensor var_4863 = const()[name = tensor("op_4863"), val = tensor([1, 1])]; tensor input_217_pad_type_0 = const()[name = tensor("input_217_pad_type_0"), val = tensor("custom")]; tensor input_217_pad_0 = const()[name = tensor("input_217_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(609102208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614017472))), name = tensor("layers_21_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_21_fc1_bias_to_fp16 = const()[name = tensor("layers_21_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614017664)))]; tensor input_217_cast_fp16 = conv(bias = layers_21_fc1_bias_to_fp16, dilations = var_4863, groups = var_4677, pad = input_217_pad_0, pad_type = input_217_pad_type_0, strides = var_4861, weight = layers_21_fc1_weight_to_fp16_palettized, x = input_215_cast_fp16)[name = tensor("input_217_cast_fp16")]; tensor input_219_mode_0 = const()[name = tensor("input_219_mode_0"), val = tensor("EXACT")]; tensor input_219_cast_fp16 = gelu(mode = input_219_mode_0, x = input_217_cast_fp16)[name = tensor("input_219_cast_fp16")]; tensor var_4869 = const()[name = tensor("op_4869"), val = tensor([1, 1])]; tensor var_4871 = const()[name = tensor("op_4871"), val = tensor([1, 1])]; tensor hidden_states_45_pad_type_0 = const()[name = tensor("hidden_states_45_pad_type_0"), val = tensor("custom")]; tensor hidden_states_45_pad_0 = const()[name = tensor("hidden_states_45_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_21_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614027968))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(620581632))), name = tensor("layers_21_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_21_fc2_bias_to_fp16 = const()[name = tensor("layers_21_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(620582208)))]; tensor hidden_states_45_cast_fp16 = conv(bias = layers_21_fc2_bias_to_fp16, dilations = var_4871, groups = var_4677, pad = hidden_states_45_pad_0, pad_type = hidden_states_45_pad_type_0, strides = var_4869, weight = layers_21_fc2_weight_to_fp16_palettized, x = input_219_cast_fp16)[name = tensor("hidden_states_45_cast_fp16")]; tensor inputs_133_cast_fp16 = add(x = inputs_131_cast_fp16, y = hidden_states_45_cast_fp16)[name = tensor("inputs_133_cast_fp16")]; tensor var_4884 = const()[name = tensor("op_4884"), val = tensor(3)]; tensor var_4891 = const()[name = tensor("op_4891"), val = tensor(1)]; tensor var_4892 = const()[name = tensor("op_4892"), val = tensor(true)]; tensor var_4904 = const()[name = tensor("op_4904"), val = tensor([1])]; tensor channels_mean_133_cast_fp16 = reduce_mean(axes = var_4904, keep_dims = var_4892, x = inputs_133_cast_fp16)[name = tensor("channels_mean_133_cast_fp16")]; tensor zero_mean_133_cast_fp16 = sub(x = inputs_133_cast_fp16, y = channels_mean_133_cast_fp16)[name = tensor("zero_mean_133_cast_fp16")]; tensor zero_mean_sq_133_cast_fp16 = mul(x = zero_mean_133_cast_fp16, y = zero_mean_133_cast_fp16)[name = tensor("zero_mean_sq_133_cast_fp16")]; tensor var_4908 = const()[name = tensor("op_4908"), val = tensor([1])]; tensor var_4909_cast_fp16 = reduce_mean(axes = var_4908, keep_dims = var_4892, x = zero_mean_sq_133_cast_fp16)[name = tensor("op_4909_cast_fp16")]; tensor var_4910_to_fp16 = const()[name = tensor("op_4910_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4911_cast_fp16 = add(x = var_4909_cast_fp16, y = var_4910_to_fp16)[name = tensor("op_4911_cast_fp16")]; tensor denom_133_epsilon_0 = const()[name = tensor("denom_133_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_133_cast_fp16 = rsqrt(epsilon = denom_133_epsilon_0, x = var_4911_cast_fp16)[name = tensor("denom_133_cast_fp16")]; tensor out_133_cast_fp16 = mul(x = zero_mean_133_cast_fp16, y = denom_133_cast_fp16)[name = tensor("out_133_cast_fp16")]; tensor obj_265_gamma_0_to_fp16 = const()[name = tensor("obj_265_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(620584832)))]; tensor obj_265_beta_0_to_fp16 = const()[name = tensor("obj_265_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(620587456)))]; tensor obj_265_epsilon_0_to_fp16 = const()[name = tensor("obj_265_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_265_cast_fp16 = batch_norm(beta = obj_265_beta_0_to_fp16, epsilon = obj_265_epsilon_0_to_fp16, gamma = obj_265_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_133_cast_fp16)[name = tensor("obj_265_cast_fp16")]; tensor var_4926 = const()[name = tensor("op_4926"), val = tensor([1, 1])]; tensor var_4928 = const()[name = tensor("op_4928"), val = tensor([1, 1])]; tensor query_89_pad_type_0 = const()[name = tensor("query_89_pad_type_0"), val = tensor("custom")]; tensor query_89_pad_0 = const()[name = tensor("query_89_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(620590080))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(621818944))), name = tensor("layers_22_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_22_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_22_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(621819136)))]; tensor query_89_cast_fp16 = conv(bias = layers_22_self_attn_q_proj_bias_to_fp16, dilations = var_4928, groups = var_4891, pad = query_89_pad_0, pad_type = query_89_pad_type_0, strides = var_4926, weight = layers_22_self_attn_q_proj_weight_to_fp16_palettized, x = obj_265_cast_fp16)[name = tensor("query_89_cast_fp16")]; tensor var_4932 = const()[name = tensor("op_4932"), val = tensor([1, 1])]; tensor var_4934 = const()[name = tensor("op_4934"), val = tensor([1, 1])]; tensor current_key_45_pad_type_0 = const()[name = tensor("current_key_45_pad_type_0"), val = tensor("custom")]; tensor current_key_45_pad_0 = const()[name = tensor("current_key_45_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(621821760))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(622641024))), name = tensor("layers_22_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_45_cast_fp16 = conv(dilations = var_4934, groups = var_4891, pad = current_key_45_pad_0, pad_type = current_key_45_pad_type_0, strides = var_4932, weight = layers_22_self_attn_k_proj_weight_to_fp16_palettized, x = obj_265_cast_fp16)[name = tensor("current_key_45_cast_fp16")]; tensor var_4939 = const()[name = tensor("op_4939"), val = tensor([1, 1])]; tensor var_4941 = const()[name = tensor("op_4941"), val = tensor([1, 1])]; tensor current_value_45_pad_type_0 = const()[name = tensor("current_value_45_pad_type_0"), val = tensor("custom")]; tensor current_value_45_pad_0 = const()[name = tensor("current_value_45_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(622641152))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(623460416))), name = tensor("layers_22_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_22_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_22_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(623460544)))]; tensor current_value_45_cast_fp16 = conv(bias = layers_22_self_attn_v_proj_bias_to_fp16, dilations = var_4941, groups = var_4891, pad = current_value_45_pad_0, pad_type = current_value_45_pad_type_0, strides = var_4939, weight = layers_22_self_attn_v_proj_weight_to_fp16_palettized, x = obj_265_cast_fp16)[name = tensor("current_value_45_cast_fp16")]; tensor var_4948_cast_fp16 = mul(x = current_key_45_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4948_cast_fp16")]; tensor var_4950_cast_fp16 = mul(x = var_103_cast_fp16_22, y = var_241_cast_fp16)[name = tensor("op_4950_cast_fp16")]; tensor key_89_cast_fp16 = add(x = var_4948_cast_fp16, y = var_4950_cast_fp16)[name = tensor("key_89_cast_fp16")]; tensor var_4952_cast_fp16 = mul(x = current_value_45_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_4952_cast_fp16")]; tensor var_4954_cast_fp16 = mul(x = var_138_cast_fp16_22, y = var_241_cast_fp16)[name = tensor("op_4954_cast_fp16")]; tensor value_89_cast_fp16 = add(x = var_4952_cast_fp16, y = var_4954_cast_fp16)[name = tensor("value_89_cast_fp16")]; tensor var_4957 = const()[name = tensor("op_4957"), val = tensor([1, 20, 64, -1])]; tensor var_4958_cast_fp16 = reshape(shape = var_4957, x = query_89_cast_fp16)[name = tensor("op_4958_cast_fp16")]; tensor var_4959_to_fp16 = const()[name = tensor("op_4959_to_fp16"), val = tensor(0x1p-3)]; tensor var_4960_cast_fp16 = mul(x = var_4958_cast_fp16, y = var_4959_to_fp16)[name = tensor("op_4960_cast_fp16")]; tensor var_4961 = const()[name = tensor("op_4961"), val = tensor([1, 20, 64, -1])]; tensor var_4962_cast_fp16 = reshape(shape = var_4961, x = key_89_cast_fp16)[name = tensor("op_4962_cast_fp16")]; tensor mh_w_133_transpose_x_0 = const()[name = tensor("mh_w_133_transpose_x_0"), val = tensor(true)]; tensor mh_w_133_transpose_y_0 = const()[name = tensor("mh_w_133_transpose_y_0"), val = tensor(false)]; tensor mh_w_133_cast_fp16 = matmul(transpose_x = mh_w_133_transpose_x_0, transpose_y = mh_w_133_transpose_y_0, x = var_4960_cast_fp16, y = var_4962_cast_fp16)[name = tensor("mh_w_133_cast_fp16")]; tensor mh_w_135_cast_fp16 = add(x = mh_w_133_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_135_cast_fp16")]; tensor var_4970_cast_fp16 = softmax(axis = var_4884, x = mh_w_135_cast_fp16)[name = tensor("op_4970_cast_fp16")]; tensor var_4971 = const()[name = tensor("op_4971"), val = tensor([1, 20, 64, -1])]; tensor var_4972_cast_fp16 = reshape(shape = var_4971, x = value_89_cast_fp16)[name = tensor("op_4972_cast_fp16")]; tensor attn_89_transpose_x_0 = const()[name = tensor("attn_89_transpose_x_0"), val = tensor(false)]; tensor attn_89_transpose_y_0 = const()[name = tensor("attn_89_transpose_y_0"), val = tensor(true)]; tensor attn_89_cast_fp16 = matmul(transpose_x = attn_89_transpose_x_0, transpose_y = attn_89_transpose_y_0, x = var_4972_cast_fp16, y = var_4970_cast_fp16)[name = tensor("attn_89_cast_fp16")]; tensor var_4975 = const()[name = tensor("op_4975"), val = tensor([1, 1280, 1, -1])]; tensor input_221_cast_fp16 = reshape(shape = var_4975, x = attn_89_cast_fp16)[name = tensor("input_221_cast_fp16")]; tensor var_4979 = const()[name = tensor("op_4979"), val = tensor([1, 1])]; tensor var_4981 = const()[name = tensor("op_4981"), val = tensor([1, 1])]; tensor obj_271_pad_type_0 = const()[name = tensor("obj_271_pad_type_0"), val = tensor("custom")]; tensor obj_271_pad_0 = const()[name = tensor("obj_271_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(623463168))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(624692032))), name = tensor("layers_22_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_22_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_22_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(624692224)))]; tensor obj_271_cast_fp16 = conv(bias = layers_22_self_attn_o_proj_bias_to_fp16, dilations = var_4981, groups = var_4891, pad = obj_271_pad_0, pad_type = obj_271_pad_type_0, strides = var_4979, weight = layers_22_self_attn_o_proj_weight_to_fp16_palettized, x = input_221_cast_fp16)[name = tensor("obj_271_cast_fp16")]; tensor inputs_135_cast_fp16 = add(x = inputs_133_cast_fp16, y = obj_271_cast_fp16)[name = tensor("inputs_135_cast_fp16")]; tensor var_4991 = const()[name = tensor("op_4991"), val = tensor([1])]; tensor channels_mean_135_cast_fp16 = reduce_mean(axes = var_4991, keep_dims = var_4892, x = inputs_135_cast_fp16)[name = tensor("channels_mean_135_cast_fp16")]; tensor zero_mean_135_cast_fp16 = sub(x = inputs_135_cast_fp16, y = channels_mean_135_cast_fp16)[name = tensor("zero_mean_135_cast_fp16")]; tensor zero_mean_sq_135_cast_fp16 = mul(x = zero_mean_135_cast_fp16, y = zero_mean_135_cast_fp16)[name = tensor("zero_mean_sq_135_cast_fp16")]; tensor var_4995 = const()[name = tensor("op_4995"), val = tensor([1])]; tensor var_4996_cast_fp16 = reduce_mean(axes = var_4995, keep_dims = var_4892, x = zero_mean_sq_135_cast_fp16)[name = tensor("op_4996_cast_fp16")]; tensor var_4997_to_fp16 = const()[name = tensor("op_4997_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4998_cast_fp16 = add(x = var_4996_cast_fp16, y = var_4997_to_fp16)[name = tensor("op_4998_cast_fp16")]; tensor denom_135_epsilon_0 = const()[name = tensor("denom_135_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_135_cast_fp16 = rsqrt(epsilon = denom_135_epsilon_0, x = var_4998_cast_fp16)[name = tensor("denom_135_cast_fp16")]; tensor out_135_cast_fp16 = mul(x = zero_mean_135_cast_fp16, y = denom_135_cast_fp16)[name = tensor("out_135_cast_fp16")]; tensor obj_273_gamma_0_to_fp16 = const()[name = tensor("obj_273_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(624694848)))]; tensor obj_273_beta_0_to_fp16 = const()[name = tensor("obj_273_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(624697472)))]; tensor obj_273_epsilon_0_to_fp16 = const()[name = tensor("obj_273_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_273_cast_fp16 = batch_norm(beta = obj_273_beta_0_to_fp16, epsilon = obj_273_epsilon_0_to_fp16, gamma = obj_273_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_135_cast_fp16)[name = tensor("obj_273_cast_fp16")]; tensor var_5013 = const()[name = tensor("op_5013"), val = tensor([1, 1])]; tensor var_5015 = const()[name = tensor("op_5015"), val = tensor([1, 1])]; tensor query_91_pad_type_0 = const()[name = tensor("query_91_pad_type_0"), val = tensor("custom")]; tensor query_91_pad_0 = const()[name = tensor("query_91_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(624700096))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(625928960))), name = tensor("layers_22_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_22_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_22_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(625929152)))]; tensor query_91_cast_fp16 = conv(bias = layers_22_encoder_attn_q_proj_bias_to_fp16, dilations = var_5015, groups = var_4891, pad = query_91_pad_0, pad_type = query_91_pad_type_0, strides = var_5013, weight = layers_22_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_273_cast_fp16)[name = tensor("query_91_cast_fp16")]; tensor var_5019 = const()[name = tensor("op_5019"), val = tensor([1, 1])]; tensor var_5021 = const()[name = tensor("op_5021"), val = tensor([1, 1])]; tensor key_91_pad_type_0 = const()[name = tensor("key_91_pad_type_0"), val = tensor("custom")]; tensor key_91_pad_0 = const()[name = tensor("key_91_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(625931776))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(626751040))), name = tensor("layers_22_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_91_cast_fp16 = conv(dilations = var_5021, groups = var_4891, pad = key_91_pad_0, pad_type = key_91_pad_type_0, strides = var_5019, weight = layers_22_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_91_cast_fp16")]; tensor var_5026 = const()[name = tensor("op_5026"), val = tensor([1, 1])]; tensor var_5028 = const()[name = tensor("op_5028"), val = tensor([1, 1])]; tensor value_91_pad_type_0 = const()[name = tensor("value_91_pad_type_0"), val = tensor("custom")]; tensor value_91_pad_0 = const()[name = tensor("value_91_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(626751168))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(627570432))), name = tensor("layers_22_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_22_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_22_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(627570560)))]; tensor value_91_cast_fp16 = conv(bias = layers_22_encoder_attn_v_proj_bias_to_fp16, dilations = var_5028, groups = var_4891, pad = value_91_pad_0, pad_type = value_91_pad_type_0, strides = var_5026, weight = layers_22_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_91_cast_fp16")]; tensor var_5032 = const()[name = tensor("op_5032"), val = tensor([1, 20, 64, -1])]; tensor var_5033_cast_fp16 = reshape(shape = var_5032, x = query_91_cast_fp16)[name = tensor("op_5033_cast_fp16")]; tensor var_5034_to_fp16 = const()[name = tensor("op_5034_to_fp16"), val = tensor(0x1p-3)]; tensor var_5035_cast_fp16 = mul(x = var_5033_cast_fp16, y = var_5034_to_fp16)[name = tensor("op_5035_cast_fp16")]; tensor var_5036 = const()[name = tensor("op_5036"), val = tensor([1, 20, 64, -1])]; tensor var_5037_cast_fp16 = reshape(shape = var_5036, x = key_91_cast_fp16)[name = tensor("op_5037_cast_fp16")]; tensor mh_w_137_transpose_x_0 = const()[name = tensor("mh_w_137_transpose_x_0"), val = tensor(true)]; tensor mh_w_137_transpose_y_0 = const()[name = tensor("mh_w_137_transpose_y_0"), val = tensor(false)]; tensor mh_w_137_cast_fp16 = matmul(transpose_x = mh_w_137_transpose_x_0, transpose_y = mh_w_137_transpose_y_0, x = var_5035_cast_fp16, y = var_5037_cast_fp16)[name = tensor("mh_w_137_cast_fp16")]; tensor var_5040_cast_fp16 = softmax(axis = var_4884, x = mh_w_137_cast_fp16)[name = tensor("op_5040_cast_fp16")]; tensor var_5041 = const()[name = tensor("op_5041"), val = tensor([1, 20, 64, -1])]; tensor var_5042_cast_fp16 = reshape(shape = var_5041, x = value_91_cast_fp16)[name = tensor("op_5042_cast_fp16")]; tensor attn_91_transpose_x_0 = const()[name = tensor("attn_91_transpose_x_0"), val = tensor(false)]; tensor attn_91_transpose_y_0 = const()[name = tensor("attn_91_transpose_y_0"), val = tensor(true)]; tensor attn_91_cast_fp16 = matmul(transpose_x = attn_91_transpose_x_0, transpose_y = attn_91_transpose_y_0, x = var_5042_cast_fp16, y = var_5040_cast_fp16)[name = tensor("attn_91_cast_fp16")]; tensor var_5045 = const()[name = tensor("op_5045"), val = tensor([1, 1280, 1, -1])]; tensor input_223_cast_fp16 = reshape(shape = var_5045, x = attn_91_cast_fp16)[name = tensor("input_223_cast_fp16")]; tensor var_5049 = const()[name = tensor("op_5049"), val = tensor([1, 1])]; tensor var_5051 = const()[name = tensor("op_5051"), val = tensor([1, 1])]; tensor obj_275_pad_type_0 = const()[name = tensor("obj_275_pad_type_0"), val = tensor("custom")]; tensor obj_275_pad_0 = const()[name = tensor("obj_275_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(627573184))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(628802048))), name = tensor("layers_22_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_22_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_22_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(628802240)))]; tensor obj_275_cast_fp16 = conv(bias = layers_22_encoder_attn_o_proj_bias_to_fp16, dilations = var_5051, groups = var_4891, pad = obj_275_pad_0, pad_type = obj_275_pad_type_0, strides = var_5049, weight = layers_22_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_223_cast_fp16)[name = tensor("obj_275_cast_fp16")]; tensor inputs_137_cast_fp16 = add(x = inputs_135_cast_fp16, y = obj_275_cast_fp16)[name = tensor("inputs_137_cast_fp16")]; tensor var_5057 = const()[name = tensor("op_5057"), val = tensor([1])]; tensor channels_mean_137_cast_fp16 = reduce_mean(axes = var_5057, keep_dims = var_4892, x = inputs_137_cast_fp16)[name = tensor("channels_mean_137_cast_fp16")]; tensor zero_mean_137_cast_fp16 = sub(x = inputs_137_cast_fp16, y = channels_mean_137_cast_fp16)[name = tensor("zero_mean_137_cast_fp16")]; tensor zero_mean_sq_137_cast_fp16 = mul(x = zero_mean_137_cast_fp16, y = zero_mean_137_cast_fp16)[name = tensor("zero_mean_sq_137_cast_fp16")]; tensor var_5061 = const()[name = tensor("op_5061"), val = tensor([1])]; tensor var_5062_cast_fp16 = reduce_mean(axes = var_5061, keep_dims = var_4892, x = zero_mean_sq_137_cast_fp16)[name = tensor("op_5062_cast_fp16")]; tensor var_5063_to_fp16 = const()[name = tensor("op_5063_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5064_cast_fp16 = add(x = var_5062_cast_fp16, y = var_5063_to_fp16)[name = tensor("op_5064_cast_fp16")]; tensor denom_137_epsilon_0 = const()[name = tensor("denom_137_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_137_cast_fp16 = rsqrt(epsilon = denom_137_epsilon_0, x = var_5064_cast_fp16)[name = tensor("denom_137_cast_fp16")]; tensor out_137_cast_fp16 = mul(x = zero_mean_137_cast_fp16, y = denom_137_cast_fp16)[name = tensor("out_137_cast_fp16")]; tensor input_225_gamma_0_to_fp16 = const()[name = tensor("input_225_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(628804864)))]; tensor input_225_beta_0_to_fp16 = const()[name = tensor("input_225_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(628807488)))]; tensor input_225_epsilon_0_to_fp16 = const()[name = tensor("input_225_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_225_cast_fp16 = batch_norm(beta = input_225_beta_0_to_fp16, epsilon = input_225_epsilon_0_to_fp16, gamma = input_225_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_137_cast_fp16)[name = tensor("input_225_cast_fp16")]; tensor var_5075 = const()[name = tensor("op_5075"), val = tensor([1, 1])]; tensor var_5077 = const()[name = tensor("op_5077"), val = tensor([1, 1])]; tensor input_227_pad_type_0 = const()[name = tensor("input_227_pad_type_0"), val = tensor("custom")]; tensor input_227_pad_0 = const()[name = tensor("input_227_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(628810112))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(633725376))), name = tensor("layers_22_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_22_fc1_bias_to_fp16 = const()[name = tensor("layers_22_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(633725568)))]; tensor input_227_cast_fp16 = conv(bias = layers_22_fc1_bias_to_fp16, dilations = var_5077, groups = var_4891, pad = input_227_pad_0, pad_type = input_227_pad_type_0, strides = var_5075, weight = layers_22_fc1_weight_to_fp16_palettized, x = input_225_cast_fp16)[name = tensor("input_227_cast_fp16")]; tensor input_229_mode_0 = const()[name = tensor("input_229_mode_0"), val = tensor("EXACT")]; tensor input_229_cast_fp16 = gelu(mode = input_229_mode_0, x = input_227_cast_fp16)[name = tensor("input_229_cast_fp16")]; tensor var_5083 = const()[name = tensor("op_5083"), val = tensor([1, 1])]; tensor var_5085 = const()[name = tensor("op_5085"), val = tensor([1, 1])]; tensor hidden_states_47_pad_type_0 = const()[name = tensor("hidden_states_47_pad_type_0"), val = tensor("custom")]; tensor hidden_states_47_pad_0 = const()[name = tensor("hidden_states_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_22_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(633735872))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(640289536))), name = tensor("layers_22_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_22_fc2_bias_to_fp16 = const()[name = tensor("layers_22_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(640290112)))]; tensor hidden_states_47_cast_fp16 = conv(bias = layers_22_fc2_bias_to_fp16, dilations = var_5085, groups = var_4891, pad = hidden_states_47_pad_0, pad_type = hidden_states_47_pad_type_0, strides = var_5083, weight = layers_22_fc2_weight_to_fp16_palettized, x = input_229_cast_fp16)[name = tensor("hidden_states_47_cast_fp16")]; tensor inputs_139_cast_fp16 = add(x = inputs_137_cast_fp16, y = hidden_states_47_cast_fp16)[name = tensor("inputs_139_cast_fp16")]; tensor var_5098 = const()[name = tensor("op_5098"), val = tensor(3)]; tensor var_5105 = const()[name = tensor("op_5105"), val = tensor(1)]; tensor var_5106 = const()[name = tensor("op_5106"), val = tensor(true)]; tensor var_5118 = const()[name = tensor("op_5118"), val = tensor([1])]; tensor channels_mean_139_cast_fp16 = reduce_mean(axes = var_5118, keep_dims = var_5106, x = inputs_139_cast_fp16)[name = tensor("channels_mean_139_cast_fp16")]; tensor zero_mean_139_cast_fp16 = sub(x = inputs_139_cast_fp16, y = channels_mean_139_cast_fp16)[name = tensor("zero_mean_139_cast_fp16")]; tensor zero_mean_sq_139_cast_fp16 = mul(x = zero_mean_139_cast_fp16, y = zero_mean_139_cast_fp16)[name = tensor("zero_mean_sq_139_cast_fp16")]; tensor var_5122 = const()[name = tensor("op_5122"), val = tensor([1])]; tensor var_5123_cast_fp16 = reduce_mean(axes = var_5122, keep_dims = var_5106, x = zero_mean_sq_139_cast_fp16)[name = tensor("op_5123_cast_fp16")]; tensor var_5124_to_fp16 = const()[name = tensor("op_5124_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5125_cast_fp16 = add(x = var_5123_cast_fp16, y = var_5124_to_fp16)[name = tensor("op_5125_cast_fp16")]; tensor denom_139_epsilon_0 = const()[name = tensor("denom_139_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_139_cast_fp16 = rsqrt(epsilon = denom_139_epsilon_0, x = var_5125_cast_fp16)[name = tensor("denom_139_cast_fp16")]; tensor out_139_cast_fp16 = mul(x = zero_mean_139_cast_fp16, y = denom_139_cast_fp16)[name = tensor("out_139_cast_fp16")]; tensor obj_277_gamma_0_to_fp16 = const()[name = tensor("obj_277_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(640292736)))]; tensor obj_277_beta_0_to_fp16 = const()[name = tensor("obj_277_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(640295360)))]; tensor obj_277_epsilon_0_to_fp16 = const()[name = tensor("obj_277_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_277_cast_fp16 = batch_norm(beta = obj_277_beta_0_to_fp16, epsilon = obj_277_epsilon_0_to_fp16, gamma = obj_277_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_139_cast_fp16)[name = tensor("obj_277_cast_fp16")]; tensor var_5140 = const()[name = tensor("op_5140"), val = tensor([1, 1])]; tensor var_5142 = const()[name = tensor("op_5142"), val = tensor([1, 1])]; tensor query_93_pad_type_0 = const()[name = tensor("query_93_pad_type_0"), val = tensor("custom")]; tensor query_93_pad_0 = const()[name = tensor("query_93_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(640297984))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641117248))), name = tensor("layers_23_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_23_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_23_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641117376)))]; tensor query_93_cast_fp16 = conv(bias = layers_23_self_attn_q_proj_bias_to_fp16, dilations = var_5142, groups = var_5105, pad = query_93_pad_0, pad_type = query_93_pad_type_0, strides = var_5140, weight = layers_23_self_attn_q_proj_weight_to_fp16_palettized, x = obj_277_cast_fp16)[name = tensor("query_93_cast_fp16")]; tensor var_5146 = const()[name = tensor("op_5146"), val = tensor([1, 1])]; tensor var_5148 = const()[name = tensor("op_5148"), val = tensor([1, 1])]; tensor current_key_47_pad_type_0 = const()[name = tensor("current_key_47_pad_type_0"), val = tensor("custom")]; tensor current_key_47_pad_0 = const()[name = tensor("current_key_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641120000))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641939264))), name = tensor("layers_23_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_47_cast_fp16 = conv(dilations = var_5148, groups = var_5105, pad = current_key_47_pad_0, pad_type = current_key_47_pad_type_0, strides = var_5146, weight = layers_23_self_attn_k_proj_weight_to_fp16_palettized, x = obj_277_cast_fp16)[name = tensor("current_key_47_cast_fp16")]; tensor var_5153 = const()[name = tensor("op_5153"), val = tensor([1, 1])]; tensor var_5155 = const()[name = tensor("op_5155"), val = tensor([1, 1])]; tensor current_value_47_pad_type_0 = const()[name = tensor("current_value_47_pad_type_0"), val = tensor("custom")]; tensor current_value_47_pad_0 = const()[name = tensor("current_value_47_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641939392))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(642758656))), name = tensor("layers_23_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_23_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_23_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(642758784)))]; tensor current_value_47_cast_fp16 = conv(bias = layers_23_self_attn_v_proj_bias_to_fp16, dilations = var_5155, groups = var_5105, pad = current_value_47_pad_0, pad_type = current_value_47_pad_type_0, strides = var_5153, weight = layers_23_self_attn_v_proj_weight_to_fp16_palettized, x = obj_277_cast_fp16)[name = tensor("current_value_47_cast_fp16")]; tensor var_5162_cast_fp16 = mul(x = current_key_47_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_5162_cast_fp16")]; tensor var_5164_cast_fp16 = mul(x = var_103_cast_fp16_23, y = var_241_cast_fp16)[name = tensor("op_5164_cast_fp16")]; tensor key_93_cast_fp16 = add(x = var_5162_cast_fp16, y = var_5164_cast_fp16)[name = tensor("key_93_cast_fp16")]; tensor var_5166_cast_fp16 = mul(x = current_value_47_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_5166_cast_fp16")]; tensor var_5168_cast_fp16 = mul(x = var_138_cast_fp16_23, y = var_241_cast_fp16)[name = tensor("op_5168_cast_fp16")]; tensor value_93_cast_fp16 = add(x = var_5166_cast_fp16, y = var_5168_cast_fp16)[name = tensor("value_93_cast_fp16")]; tensor var_5171 = const()[name = tensor("op_5171"), val = tensor([1, 20, 64, -1])]; tensor var_5172_cast_fp16 = reshape(shape = var_5171, x = query_93_cast_fp16)[name = tensor("op_5172_cast_fp16")]; tensor var_5173_to_fp16 = const()[name = tensor("op_5173_to_fp16"), val = tensor(0x1p-3)]; tensor var_5174_cast_fp16 = mul(x = var_5172_cast_fp16, y = var_5173_to_fp16)[name = tensor("op_5174_cast_fp16")]; tensor var_5175 = const()[name = tensor("op_5175"), val = tensor([1, 20, 64, -1])]; tensor var_5176_cast_fp16 = reshape(shape = var_5175, x = key_93_cast_fp16)[name = tensor("op_5176_cast_fp16")]; tensor mh_w_139_transpose_x_0 = const()[name = tensor("mh_w_139_transpose_x_0"), val = tensor(true)]; tensor mh_w_139_transpose_y_0 = const()[name = tensor("mh_w_139_transpose_y_0"), val = tensor(false)]; tensor mh_w_139_cast_fp16 = matmul(transpose_x = mh_w_139_transpose_x_0, transpose_y = mh_w_139_transpose_y_0, x = var_5174_cast_fp16, y = var_5176_cast_fp16)[name = tensor("mh_w_139_cast_fp16")]; tensor mh_w_141_cast_fp16 = add(x = mh_w_139_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_141_cast_fp16")]; tensor var_5184_cast_fp16 = softmax(axis = var_5098, x = mh_w_141_cast_fp16)[name = tensor("op_5184_cast_fp16")]; tensor var_5185 = const()[name = tensor("op_5185"), val = tensor([1, 20, 64, -1])]; tensor var_5186_cast_fp16 = reshape(shape = var_5185, x = value_93_cast_fp16)[name = tensor("op_5186_cast_fp16")]; tensor attn_93_transpose_x_0 = const()[name = tensor("attn_93_transpose_x_0"), val = tensor(false)]; tensor attn_93_transpose_y_0 = const()[name = tensor("attn_93_transpose_y_0"), val = tensor(true)]; tensor attn_93_cast_fp16 = matmul(transpose_x = attn_93_transpose_x_0, transpose_y = attn_93_transpose_y_0, x = var_5186_cast_fp16, y = var_5184_cast_fp16)[name = tensor("attn_93_cast_fp16")]; tensor var_5189 = const()[name = tensor("op_5189"), val = tensor([1, 1280, 1, -1])]; tensor input_231_cast_fp16 = reshape(shape = var_5189, x = attn_93_cast_fp16)[name = tensor("input_231_cast_fp16")]; tensor var_5193 = const()[name = tensor("op_5193"), val = tensor([1, 1])]; tensor var_5195 = const()[name = tensor("op_5195"), val = tensor([1, 1])]; tensor obj_283_pad_type_0 = const()[name = tensor("obj_283_pad_type_0"), val = tensor("custom")]; tensor obj_283_pad_0 = const()[name = tensor("obj_283_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(642761408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(643580672))), name = tensor("layers_23_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_23_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_23_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(643580800)))]; tensor obj_283_cast_fp16 = conv(bias = layers_23_self_attn_o_proj_bias_to_fp16, dilations = var_5195, groups = var_5105, pad = obj_283_pad_0, pad_type = obj_283_pad_type_0, strides = var_5193, weight = layers_23_self_attn_o_proj_weight_to_fp16_palettized, x = input_231_cast_fp16)[name = tensor("obj_283_cast_fp16")]; tensor inputs_141_cast_fp16 = add(x = inputs_139_cast_fp16, y = obj_283_cast_fp16)[name = tensor("inputs_141_cast_fp16")]; tensor var_5205 = const()[name = tensor("op_5205"), val = tensor([1])]; tensor channels_mean_141_cast_fp16 = reduce_mean(axes = var_5205, keep_dims = var_5106, x = inputs_141_cast_fp16)[name = tensor("channels_mean_141_cast_fp16")]; tensor zero_mean_141_cast_fp16 = sub(x = inputs_141_cast_fp16, y = channels_mean_141_cast_fp16)[name = tensor("zero_mean_141_cast_fp16")]; tensor zero_mean_sq_141_cast_fp16 = mul(x = zero_mean_141_cast_fp16, y = zero_mean_141_cast_fp16)[name = tensor("zero_mean_sq_141_cast_fp16")]; tensor var_5209 = const()[name = tensor("op_5209"), val = tensor([1])]; tensor var_5210_cast_fp16 = reduce_mean(axes = var_5209, keep_dims = var_5106, x = zero_mean_sq_141_cast_fp16)[name = tensor("op_5210_cast_fp16")]; tensor var_5211_to_fp16 = const()[name = tensor("op_5211_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5212_cast_fp16 = add(x = var_5210_cast_fp16, y = var_5211_to_fp16)[name = tensor("op_5212_cast_fp16")]; tensor denom_141_epsilon_0 = const()[name = tensor("denom_141_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_141_cast_fp16 = rsqrt(epsilon = denom_141_epsilon_0, x = var_5212_cast_fp16)[name = tensor("denom_141_cast_fp16")]; tensor out_141_cast_fp16 = mul(x = zero_mean_141_cast_fp16, y = denom_141_cast_fp16)[name = tensor("out_141_cast_fp16")]; tensor obj_285_gamma_0_to_fp16 = const()[name = tensor("obj_285_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(643583424)))]; tensor obj_285_beta_0_to_fp16 = const()[name = tensor("obj_285_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(643586048)))]; tensor obj_285_epsilon_0_to_fp16 = const()[name = tensor("obj_285_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_285_cast_fp16 = batch_norm(beta = obj_285_beta_0_to_fp16, epsilon = obj_285_epsilon_0_to_fp16, gamma = obj_285_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_141_cast_fp16)[name = tensor("obj_285_cast_fp16")]; tensor var_5227 = const()[name = tensor("op_5227"), val = tensor([1, 1])]; tensor var_5229 = const()[name = tensor("op_5229"), val = tensor([1, 1])]; tensor query_95_pad_type_0 = const()[name = tensor("query_95_pad_type_0"), val = tensor("custom")]; tensor query_95_pad_0 = const()[name = tensor("query_95_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(643588672))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644817536))), name = tensor("layers_23_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_23_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_23_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644817728)))]; tensor query_95_cast_fp16 = conv(bias = layers_23_encoder_attn_q_proj_bias_to_fp16, dilations = var_5229, groups = var_5105, pad = query_95_pad_0, pad_type = query_95_pad_type_0, strides = var_5227, weight = layers_23_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_285_cast_fp16)[name = tensor("query_95_cast_fp16")]; tensor var_5233 = const()[name = tensor("op_5233"), val = tensor([1, 1])]; tensor var_5235 = const()[name = tensor("op_5235"), val = tensor([1, 1])]; tensor key_95_pad_type_0 = const()[name = tensor("key_95_pad_type_0"), val = tensor("custom")]; tensor key_95_pad_0 = const()[name = tensor("key_95_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(644820352))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(645639616))), name = tensor("layers_23_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_95_cast_fp16 = conv(dilations = var_5235, groups = var_5105, pad = key_95_pad_0, pad_type = key_95_pad_type_0, strides = var_5233, weight = layers_23_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_95_cast_fp16")]; tensor var_5240 = const()[name = tensor("op_5240"), val = tensor([1, 1])]; tensor var_5242 = const()[name = tensor("op_5242"), val = tensor([1, 1])]; tensor value_95_pad_type_0 = const()[name = tensor("value_95_pad_type_0"), val = tensor("custom")]; tensor value_95_pad_0 = const()[name = tensor("value_95_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(645639744))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(647278208))), name = tensor("layers_23_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_23_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_23_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(647278784)))]; tensor value_95_cast_fp16 = conv(bias = layers_23_encoder_attn_v_proj_bias_to_fp16, dilations = var_5242, groups = var_5105, pad = value_95_pad_0, pad_type = value_95_pad_type_0, strides = var_5240, weight = layers_23_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_95_cast_fp16")]; tensor var_5246 = const()[name = tensor("op_5246"), val = tensor([1, 20, 64, -1])]; tensor var_5247_cast_fp16 = reshape(shape = var_5246, x = query_95_cast_fp16)[name = tensor("op_5247_cast_fp16")]; tensor var_5248_to_fp16 = const()[name = tensor("op_5248_to_fp16"), val = tensor(0x1p-3)]; tensor var_5249_cast_fp16 = mul(x = var_5247_cast_fp16, y = var_5248_to_fp16)[name = tensor("op_5249_cast_fp16")]; tensor var_5250 = const()[name = tensor("op_5250"), val = tensor([1, 20, 64, -1])]; tensor var_5251_cast_fp16 = reshape(shape = var_5250, x = key_95_cast_fp16)[name = tensor("op_5251_cast_fp16")]; tensor mh_w_143_transpose_x_0 = const()[name = tensor("mh_w_143_transpose_x_0"), val = tensor(true)]; tensor mh_w_143_transpose_y_0 = const()[name = tensor("mh_w_143_transpose_y_0"), val = tensor(false)]; tensor mh_w_143_cast_fp16 = matmul(transpose_x = mh_w_143_transpose_x_0, transpose_y = mh_w_143_transpose_y_0, x = var_5249_cast_fp16, y = var_5251_cast_fp16)[name = tensor("mh_w_143_cast_fp16")]; tensor var_5254_cast_fp16 = softmax(axis = var_5098, x = mh_w_143_cast_fp16)[name = tensor("op_5254_cast_fp16")]; tensor var_5255 = const()[name = tensor("op_5255"), val = tensor([1, 20, 64, -1])]; tensor var_5256_cast_fp16 = reshape(shape = var_5255, x = value_95_cast_fp16)[name = tensor("op_5256_cast_fp16")]; tensor attn_95_transpose_x_0 = const()[name = tensor("attn_95_transpose_x_0"), val = tensor(false)]; tensor attn_95_transpose_y_0 = const()[name = tensor("attn_95_transpose_y_0"), val = tensor(true)]; tensor attn_95_cast_fp16 = matmul(transpose_x = attn_95_transpose_x_0, transpose_y = attn_95_transpose_y_0, x = var_5256_cast_fp16, y = var_5254_cast_fp16)[name = tensor("attn_95_cast_fp16")]; tensor var_5259 = const()[name = tensor("op_5259"), val = tensor([1, 1280, 1, -1])]; tensor input_233_cast_fp16 = reshape(shape = var_5259, x = attn_95_cast_fp16)[name = tensor("input_233_cast_fp16")]; tensor var_5263 = const()[name = tensor("op_5263"), val = tensor([1, 1])]; tensor var_5265 = const()[name = tensor("op_5265"), val = tensor([1, 1])]; tensor obj_287_pad_type_0 = const()[name = tensor("obj_287_pad_type_0"), val = tensor("custom")]; tensor obj_287_pad_0 = const()[name = tensor("obj_287_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(647281408))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(648510272))), name = tensor("layers_23_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_23_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_23_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(648510464)))]; tensor obj_287_cast_fp16 = conv(bias = layers_23_encoder_attn_o_proj_bias_to_fp16, dilations = var_5265, groups = var_5105, pad = obj_287_pad_0, pad_type = obj_287_pad_type_0, strides = var_5263, weight = layers_23_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_233_cast_fp16)[name = tensor("obj_287_cast_fp16")]; tensor inputs_143_cast_fp16 = add(x = inputs_141_cast_fp16, y = obj_287_cast_fp16)[name = tensor("inputs_143_cast_fp16")]; tensor var_5271 = const()[name = tensor("op_5271"), val = tensor([1])]; tensor channels_mean_143_cast_fp16 = reduce_mean(axes = var_5271, keep_dims = var_5106, x = inputs_143_cast_fp16)[name = tensor("channels_mean_143_cast_fp16")]; tensor zero_mean_143_cast_fp16 = sub(x = inputs_143_cast_fp16, y = channels_mean_143_cast_fp16)[name = tensor("zero_mean_143_cast_fp16")]; tensor zero_mean_sq_143_cast_fp16 = mul(x = zero_mean_143_cast_fp16, y = zero_mean_143_cast_fp16)[name = tensor("zero_mean_sq_143_cast_fp16")]; tensor var_5275 = const()[name = tensor("op_5275"), val = tensor([1])]; tensor var_5276_cast_fp16 = reduce_mean(axes = var_5275, keep_dims = var_5106, x = zero_mean_sq_143_cast_fp16)[name = tensor("op_5276_cast_fp16")]; tensor var_5277_to_fp16 = const()[name = tensor("op_5277_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5278_cast_fp16 = add(x = var_5276_cast_fp16, y = var_5277_to_fp16)[name = tensor("op_5278_cast_fp16")]; tensor denom_143_epsilon_0 = const()[name = tensor("denom_143_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_143_cast_fp16 = rsqrt(epsilon = denom_143_epsilon_0, x = var_5278_cast_fp16)[name = tensor("denom_143_cast_fp16")]; tensor out_143_cast_fp16 = mul(x = zero_mean_143_cast_fp16, y = denom_143_cast_fp16)[name = tensor("out_143_cast_fp16")]; tensor input_235_gamma_0_to_fp16 = const()[name = tensor("input_235_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(648513088)))]; tensor input_235_beta_0_to_fp16 = const()[name = tensor("input_235_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(648515712)))]; tensor input_235_epsilon_0_to_fp16 = const()[name = tensor("input_235_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_235_cast_fp16 = batch_norm(beta = input_235_beta_0_to_fp16, epsilon = input_235_epsilon_0_to_fp16, gamma = input_235_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_143_cast_fp16)[name = tensor("input_235_cast_fp16")]; tensor var_5289 = const()[name = tensor("op_5289"), val = tensor([1, 1])]; tensor var_5291 = const()[name = tensor("op_5291"), val = tensor([1, 1])]; tensor input_237_pad_type_0 = const()[name = tensor("input_237_pad_type_0"), val = tensor("custom")]; tensor input_237_pad_0 = const()[name = tensor("input_237_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(648518336))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(653433600))), name = tensor("layers_23_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_23_fc1_bias_to_fp16 = const()[name = tensor("layers_23_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(653433792)))]; tensor input_237_cast_fp16 = conv(bias = layers_23_fc1_bias_to_fp16, dilations = var_5291, groups = var_5105, pad = input_237_pad_0, pad_type = input_237_pad_type_0, strides = var_5289, weight = layers_23_fc1_weight_to_fp16_palettized, x = input_235_cast_fp16)[name = tensor("input_237_cast_fp16")]; tensor input_239_mode_0 = const()[name = tensor("input_239_mode_0"), val = tensor("EXACT")]; tensor input_239_cast_fp16 = gelu(mode = input_239_mode_0, x = input_237_cast_fp16)[name = tensor("input_239_cast_fp16")]; tensor var_5297 = const()[name = tensor("op_5297"), val = tensor([1, 1])]; tensor var_5299 = const()[name = tensor("op_5299"), val = tensor([1, 1])]; tensor hidden_states_49_pad_type_0 = const()[name = tensor("hidden_states_49_pad_type_0"), val = tensor("custom")]; tensor hidden_states_49_pad_0 = const()[name = tensor("hidden_states_49_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_23_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(653444096))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(658359360))), name = tensor("layers_23_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_23_fc2_bias_to_fp16 = const()[name = tensor("layers_23_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(658359552)))]; tensor hidden_states_49_cast_fp16 = conv(bias = layers_23_fc2_bias_to_fp16, dilations = var_5299, groups = var_5105, pad = hidden_states_49_pad_0, pad_type = hidden_states_49_pad_type_0, strides = var_5297, weight = layers_23_fc2_weight_to_fp16_palettized, x = input_239_cast_fp16)[name = tensor("hidden_states_49_cast_fp16")]; tensor inputs_145_cast_fp16 = add(x = inputs_143_cast_fp16, y = hidden_states_49_cast_fp16)[name = tensor("inputs_145_cast_fp16")]; tensor var_5312 = const()[name = tensor("op_5312"), val = tensor(3)]; tensor var_5319 = const()[name = tensor("op_5319"), val = tensor(1)]; tensor var_5320 = const()[name = tensor("op_5320"), val = tensor(true)]; tensor var_5332 = const()[name = tensor("op_5332"), val = tensor([1])]; tensor channels_mean_145_cast_fp16 = reduce_mean(axes = var_5332, keep_dims = var_5320, x = inputs_145_cast_fp16)[name = tensor("channels_mean_145_cast_fp16")]; tensor zero_mean_145_cast_fp16 = sub(x = inputs_145_cast_fp16, y = channels_mean_145_cast_fp16)[name = tensor("zero_mean_145_cast_fp16")]; tensor zero_mean_sq_145_cast_fp16 = mul(x = zero_mean_145_cast_fp16, y = zero_mean_145_cast_fp16)[name = tensor("zero_mean_sq_145_cast_fp16")]; tensor var_5336 = const()[name = tensor("op_5336"), val = tensor([1])]; tensor var_5337_cast_fp16 = reduce_mean(axes = var_5336, keep_dims = var_5320, x = zero_mean_sq_145_cast_fp16)[name = tensor("op_5337_cast_fp16")]; tensor var_5338_to_fp16 = const()[name = tensor("op_5338_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5339_cast_fp16 = add(x = var_5337_cast_fp16, y = var_5338_to_fp16)[name = tensor("op_5339_cast_fp16")]; tensor denom_145_epsilon_0 = const()[name = tensor("denom_145_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_145_cast_fp16 = rsqrt(epsilon = denom_145_epsilon_0, x = var_5339_cast_fp16)[name = tensor("denom_145_cast_fp16")]; tensor out_145_cast_fp16 = mul(x = zero_mean_145_cast_fp16, y = denom_145_cast_fp16)[name = tensor("out_145_cast_fp16")]; tensor obj_289_gamma_0_to_fp16 = const()[name = tensor("obj_289_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(658362176)))]; tensor obj_289_beta_0_to_fp16 = const()[name = tensor("obj_289_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(658364800)))]; tensor obj_289_epsilon_0_to_fp16 = const()[name = tensor("obj_289_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_289_cast_fp16 = batch_norm(beta = obj_289_beta_0_to_fp16, epsilon = obj_289_epsilon_0_to_fp16, gamma = obj_289_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_145_cast_fp16)[name = tensor("obj_289_cast_fp16")]; tensor var_5354 = const()[name = tensor("op_5354"), val = tensor([1, 1])]; tensor var_5356 = const()[name = tensor("op_5356"), val = tensor([1, 1])]; tensor query_97_pad_type_0 = const()[name = tensor("query_97_pad_type_0"), val = tensor("custom")]; tensor query_97_pad_0 = const()[name = tensor("query_97_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(658367424))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(659186688))), name = tensor("layers_24_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_24_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_24_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(659186816)))]; tensor query_97_cast_fp16 = conv(bias = layers_24_self_attn_q_proj_bias_to_fp16, dilations = var_5356, groups = var_5319, pad = query_97_pad_0, pad_type = query_97_pad_type_0, strides = var_5354, weight = layers_24_self_attn_q_proj_weight_to_fp16_palettized, x = obj_289_cast_fp16)[name = tensor("query_97_cast_fp16")]; tensor var_5360 = const()[name = tensor("op_5360"), val = tensor([1, 1])]; tensor var_5362 = const()[name = tensor("op_5362"), val = tensor([1, 1])]; tensor current_key_49_pad_type_0 = const()[name = tensor("current_key_49_pad_type_0"), val = tensor("custom")]; tensor current_key_49_pad_0 = const()[name = tensor("current_key_49_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(659189440))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(660008704))), name = tensor("layers_24_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_49_cast_fp16 = conv(dilations = var_5362, groups = var_5319, pad = current_key_49_pad_0, pad_type = current_key_49_pad_type_0, strides = var_5360, weight = layers_24_self_attn_k_proj_weight_to_fp16_palettized, x = obj_289_cast_fp16)[name = tensor("current_key_49_cast_fp16")]; tensor var_5367 = const()[name = tensor("op_5367"), val = tensor([1, 1])]; tensor var_5369 = const()[name = tensor("op_5369"), val = tensor([1, 1])]; tensor current_value_49_pad_type_0 = const()[name = tensor("current_value_49_pad_type_0"), val = tensor("custom")]; tensor current_value_49_pad_0 = const()[name = tensor("current_value_49_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(660008832))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(660828096))), name = tensor("layers_24_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_24_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_24_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(660828224)))]; tensor current_value_49_cast_fp16 = conv(bias = layers_24_self_attn_v_proj_bias_to_fp16, dilations = var_5369, groups = var_5319, pad = current_value_49_pad_0, pad_type = current_value_49_pad_type_0, strides = var_5367, weight = layers_24_self_attn_v_proj_weight_to_fp16_palettized, x = obj_289_cast_fp16)[name = tensor("current_value_49_cast_fp16")]; tensor var_5376_cast_fp16 = mul(x = current_key_49_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_5376_cast_fp16")]; tensor var_5378_cast_fp16 = mul(x = var_103_cast_fp16_24, y = var_241_cast_fp16)[name = tensor("op_5378_cast_fp16")]; tensor key_97_cast_fp16 = add(x = var_5376_cast_fp16, y = var_5378_cast_fp16)[name = tensor("key_97_cast_fp16")]; tensor var_5380_cast_fp16 = mul(x = current_value_49_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_5380_cast_fp16")]; tensor var_5382_cast_fp16 = mul(x = var_138_cast_fp16_24, y = var_241_cast_fp16)[name = tensor("op_5382_cast_fp16")]; tensor value_97_cast_fp16 = add(x = var_5380_cast_fp16, y = var_5382_cast_fp16)[name = tensor("value_97_cast_fp16")]; tensor var_5385 = const()[name = tensor("op_5385"), val = tensor([1, 20, 64, -1])]; tensor var_5386_cast_fp16 = reshape(shape = var_5385, x = query_97_cast_fp16)[name = tensor("op_5386_cast_fp16")]; tensor var_5387_to_fp16 = const()[name = tensor("op_5387_to_fp16"), val = tensor(0x1p-3)]; tensor var_5388_cast_fp16 = mul(x = var_5386_cast_fp16, y = var_5387_to_fp16)[name = tensor("op_5388_cast_fp16")]; tensor var_5389 = const()[name = tensor("op_5389"), val = tensor([1, 20, 64, -1])]; tensor var_5390_cast_fp16 = reshape(shape = var_5389, x = key_97_cast_fp16)[name = tensor("op_5390_cast_fp16")]; tensor mh_w_145_transpose_x_0 = const()[name = tensor("mh_w_145_transpose_x_0"), val = tensor(true)]; tensor mh_w_145_transpose_y_0 = const()[name = tensor("mh_w_145_transpose_y_0"), val = tensor(false)]; tensor mh_w_145_cast_fp16 = matmul(transpose_x = mh_w_145_transpose_x_0, transpose_y = mh_w_145_transpose_y_0, x = var_5388_cast_fp16, y = var_5390_cast_fp16)[name = tensor("mh_w_145_cast_fp16")]; tensor mh_w_147_cast_fp16 = add(x = mh_w_145_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_147_cast_fp16")]; tensor var_5398_cast_fp16 = softmax(axis = var_5312, x = mh_w_147_cast_fp16)[name = tensor("op_5398_cast_fp16")]; tensor var_5399 = const()[name = tensor("op_5399"), val = tensor([1, 20, 64, -1])]; tensor var_5400_cast_fp16 = reshape(shape = var_5399, x = value_97_cast_fp16)[name = tensor("op_5400_cast_fp16")]; tensor attn_97_transpose_x_0 = const()[name = tensor("attn_97_transpose_x_0"), val = tensor(false)]; tensor attn_97_transpose_y_0 = const()[name = tensor("attn_97_transpose_y_0"), val = tensor(true)]; tensor attn_97_cast_fp16 = matmul(transpose_x = attn_97_transpose_x_0, transpose_y = attn_97_transpose_y_0, x = var_5400_cast_fp16, y = var_5398_cast_fp16)[name = tensor("attn_97_cast_fp16")]; tensor var_5403 = const()[name = tensor("op_5403"), val = tensor([1, 1280, 1, -1])]; tensor input_241_cast_fp16 = reshape(shape = var_5403, x = attn_97_cast_fp16)[name = tensor("input_241_cast_fp16")]; tensor var_5407 = const()[name = tensor("op_5407"), val = tensor([1, 1])]; tensor var_5409 = const()[name = tensor("op_5409"), val = tensor([1, 1])]; tensor obj_295_pad_type_0 = const()[name = tensor("obj_295_pad_type_0"), val = tensor("custom")]; tensor obj_295_pad_0 = const()[name = tensor("obj_295_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(660830848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(662059712))), name = tensor("layers_24_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_24_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_24_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(662059904)))]; tensor obj_295_cast_fp16 = conv(bias = layers_24_self_attn_o_proj_bias_to_fp16, dilations = var_5409, groups = var_5319, pad = obj_295_pad_0, pad_type = obj_295_pad_type_0, strides = var_5407, weight = layers_24_self_attn_o_proj_weight_to_fp16_palettized, x = input_241_cast_fp16)[name = tensor("obj_295_cast_fp16")]; tensor inputs_147_cast_fp16 = add(x = inputs_145_cast_fp16, y = obj_295_cast_fp16)[name = tensor("inputs_147_cast_fp16")]; tensor var_5419 = const()[name = tensor("op_5419"), val = tensor([1])]; tensor channels_mean_147_cast_fp16 = reduce_mean(axes = var_5419, keep_dims = var_5320, x = inputs_147_cast_fp16)[name = tensor("channels_mean_147_cast_fp16")]; tensor zero_mean_147_cast_fp16 = sub(x = inputs_147_cast_fp16, y = channels_mean_147_cast_fp16)[name = tensor("zero_mean_147_cast_fp16")]; tensor zero_mean_sq_147_cast_fp16 = mul(x = zero_mean_147_cast_fp16, y = zero_mean_147_cast_fp16)[name = tensor("zero_mean_sq_147_cast_fp16")]; tensor var_5423 = const()[name = tensor("op_5423"), val = tensor([1])]; tensor var_5424_cast_fp16 = reduce_mean(axes = var_5423, keep_dims = var_5320, x = zero_mean_sq_147_cast_fp16)[name = tensor("op_5424_cast_fp16")]; tensor var_5425_to_fp16 = const()[name = tensor("op_5425_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5426_cast_fp16 = add(x = var_5424_cast_fp16, y = var_5425_to_fp16)[name = tensor("op_5426_cast_fp16")]; tensor denom_147_epsilon_0 = const()[name = tensor("denom_147_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_147_cast_fp16 = rsqrt(epsilon = denom_147_epsilon_0, x = var_5426_cast_fp16)[name = tensor("denom_147_cast_fp16")]; tensor out_147_cast_fp16 = mul(x = zero_mean_147_cast_fp16, y = denom_147_cast_fp16)[name = tensor("out_147_cast_fp16")]; tensor obj_297_gamma_0_to_fp16 = const()[name = tensor("obj_297_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(662062528)))]; tensor obj_297_beta_0_to_fp16 = const()[name = tensor("obj_297_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(662065152)))]; tensor obj_297_epsilon_0_to_fp16 = const()[name = tensor("obj_297_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_297_cast_fp16 = batch_norm(beta = obj_297_beta_0_to_fp16, epsilon = obj_297_epsilon_0_to_fp16, gamma = obj_297_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_147_cast_fp16)[name = tensor("obj_297_cast_fp16")]; tensor var_5441 = const()[name = tensor("op_5441"), val = tensor([1, 1])]; tensor var_5443 = const()[name = tensor("op_5443"), val = tensor([1, 1])]; tensor query_99_pad_type_0 = const()[name = tensor("query_99_pad_type_0"), val = tensor("custom")]; tensor query_99_pad_0 = const()[name = tensor("query_99_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(662067776))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(663296640))), name = tensor("layers_24_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_24_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_24_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(663296832)))]; tensor query_99_cast_fp16 = conv(bias = layers_24_encoder_attn_q_proj_bias_to_fp16, dilations = var_5443, groups = var_5319, pad = query_99_pad_0, pad_type = query_99_pad_type_0, strides = var_5441, weight = layers_24_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_297_cast_fp16)[name = tensor("query_99_cast_fp16")]; tensor var_5447 = const()[name = tensor("op_5447"), val = tensor([1, 1])]; tensor var_5449 = const()[name = tensor("op_5449"), val = tensor([1, 1])]; tensor key_99_pad_type_0 = const()[name = tensor("key_99_pad_type_0"), val = tensor("custom")]; tensor key_99_pad_0 = const()[name = tensor("key_99_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(663299456))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(664528320))), name = tensor("layers_24_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_99_cast_fp16 = conv(dilations = var_5449, groups = var_5319, pad = key_99_pad_0, pad_type = key_99_pad_type_0, strides = var_5447, weight = layers_24_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_99_cast_fp16")]; tensor var_5454 = const()[name = tensor("op_5454"), val = tensor([1, 1])]; tensor var_5456 = const()[name = tensor("op_5456"), val = tensor([1, 1])]; tensor value_99_pad_type_0 = const()[name = tensor("value_99_pad_type_0"), val = tensor("custom")]; tensor value_99_pad_0 = const()[name = tensor("value_99_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(664528512))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(665757376))), name = tensor("layers_24_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_24_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_24_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(665757568)))]; tensor value_99_cast_fp16 = conv(bias = layers_24_encoder_attn_v_proj_bias_to_fp16, dilations = var_5456, groups = var_5319, pad = value_99_pad_0, pad_type = value_99_pad_type_0, strides = var_5454, weight = layers_24_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_99_cast_fp16")]; tensor var_5460 = const()[name = tensor("op_5460"), val = tensor([1, 20, 64, -1])]; tensor var_5461_cast_fp16 = reshape(shape = var_5460, x = query_99_cast_fp16)[name = tensor("op_5461_cast_fp16")]; tensor var_5462_to_fp16 = const()[name = tensor("op_5462_to_fp16"), val = tensor(0x1p-3)]; tensor var_5463_cast_fp16 = mul(x = var_5461_cast_fp16, y = var_5462_to_fp16)[name = tensor("op_5463_cast_fp16")]; tensor var_5464 = const()[name = tensor("op_5464"), val = tensor([1, 20, 64, -1])]; tensor var_5465_cast_fp16 = reshape(shape = var_5464, x = key_99_cast_fp16)[name = tensor("op_5465_cast_fp16")]; tensor mh_w_149_transpose_x_0 = const()[name = tensor("mh_w_149_transpose_x_0"), val = tensor(true)]; tensor mh_w_149_transpose_y_0 = const()[name = tensor("mh_w_149_transpose_y_0"), val = tensor(false)]; tensor mh_w_149_cast_fp16 = matmul(transpose_x = mh_w_149_transpose_x_0, transpose_y = mh_w_149_transpose_y_0, x = var_5463_cast_fp16, y = var_5465_cast_fp16)[name = tensor("mh_w_149_cast_fp16")]; tensor var_5468_cast_fp16 = softmax(axis = var_5312, x = mh_w_149_cast_fp16)[name = tensor("op_5468_cast_fp16")]; tensor var_5469 = const()[name = tensor("op_5469"), val = tensor([1, 20, 64, -1])]; tensor var_5470_cast_fp16 = reshape(shape = var_5469, x = value_99_cast_fp16)[name = tensor("op_5470_cast_fp16")]; tensor attn_99_transpose_x_0 = const()[name = tensor("attn_99_transpose_x_0"), val = tensor(false)]; tensor attn_99_transpose_y_0 = const()[name = tensor("attn_99_transpose_y_0"), val = tensor(true)]; tensor attn_99_cast_fp16 = matmul(transpose_x = attn_99_transpose_x_0, transpose_y = attn_99_transpose_y_0, x = var_5470_cast_fp16, y = var_5468_cast_fp16)[name = tensor("attn_99_cast_fp16")]; tensor var_5473 = const()[name = tensor("op_5473"), val = tensor([1, 1280, 1, -1])]; tensor input_243_cast_fp16 = reshape(shape = var_5473, x = attn_99_cast_fp16)[name = tensor("input_243_cast_fp16")]; tensor var_5477 = const()[name = tensor("op_5477"), val = tensor([1, 1])]; tensor var_5479 = const()[name = tensor("op_5479"), val = tensor([1, 1])]; tensor obj_299_pad_type_0 = const()[name = tensor("obj_299_pad_type_0"), val = tensor("custom")]; tensor obj_299_pad_0 = const()[name = tensor("obj_299_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(665760192))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(666989056))), name = tensor("layers_24_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_24_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_24_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(666989248)))]; tensor obj_299_cast_fp16 = conv(bias = layers_24_encoder_attn_o_proj_bias_to_fp16, dilations = var_5479, groups = var_5319, pad = obj_299_pad_0, pad_type = obj_299_pad_type_0, strides = var_5477, weight = layers_24_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_243_cast_fp16)[name = tensor("obj_299_cast_fp16")]; tensor inputs_149_cast_fp16 = add(x = inputs_147_cast_fp16, y = obj_299_cast_fp16)[name = tensor("inputs_149_cast_fp16")]; tensor var_5485 = const()[name = tensor("op_5485"), val = tensor([1])]; tensor channels_mean_149_cast_fp16 = reduce_mean(axes = var_5485, keep_dims = var_5320, x = inputs_149_cast_fp16)[name = tensor("channels_mean_149_cast_fp16")]; tensor zero_mean_149_cast_fp16 = sub(x = inputs_149_cast_fp16, y = channels_mean_149_cast_fp16)[name = tensor("zero_mean_149_cast_fp16")]; tensor zero_mean_sq_149_cast_fp16 = mul(x = zero_mean_149_cast_fp16, y = zero_mean_149_cast_fp16)[name = tensor("zero_mean_sq_149_cast_fp16")]; tensor var_5489 = const()[name = tensor("op_5489"), val = tensor([1])]; tensor var_5490_cast_fp16 = reduce_mean(axes = var_5489, keep_dims = var_5320, x = zero_mean_sq_149_cast_fp16)[name = tensor("op_5490_cast_fp16")]; tensor var_5491_to_fp16 = const()[name = tensor("op_5491_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5492_cast_fp16 = add(x = var_5490_cast_fp16, y = var_5491_to_fp16)[name = tensor("op_5492_cast_fp16")]; tensor denom_149_epsilon_0 = const()[name = tensor("denom_149_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_149_cast_fp16 = rsqrt(epsilon = denom_149_epsilon_0, x = var_5492_cast_fp16)[name = tensor("denom_149_cast_fp16")]; tensor out_149_cast_fp16 = mul(x = zero_mean_149_cast_fp16, y = denom_149_cast_fp16)[name = tensor("out_149_cast_fp16")]; tensor input_245_gamma_0_to_fp16 = const()[name = tensor("input_245_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(666991872)))]; tensor input_245_beta_0_to_fp16 = const()[name = tensor("input_245_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(666994496)))]; tensor input_245_epsilon_0_to_fp16 = const()[name = tensor("input_245_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_245_cast_fp16 = batch_norm(beta = input_245_beta_0_to_fp16, epsilon = input_245_epsilon_0_to_fp16, gamma = input_245_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_149_cast_fp16)[name = tensor("input_245_cast_fp16")]; tensor var_5503 = const()[name = tensor("op_5503"), val = tensor([1, 1])]; tensor var_5505 = const()[name = tensor("op_5505"), val = tensor([1, 1])]; tensor input_247_pad_type_0 = const()[name = tensor("input_247_pad_type_0"), val = tensor("custom")]; tensor input_247_pad_0 = const()[name = tensor("input_247_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(666997120))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(671912384))), name = tensor("layers_24_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_24_fc1_bias_to_fp16 = const()[name = tensor("layers_24_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(671912576)))]; tensor input_247_cast_fp16 = conv(bias = layers_24_fc1_bias_to_fp16, dilations = var_5505, groups = var_5319, pad = input_247_pad_0, pad_type = input_247_pad_type_0, strides = var_5503, weight = layers_24_fc1_weight_to_fp16_palettized, x = input_245_cast_fp16)[name = tensor("input_247_cast_fp16")]; tensor input_249_mode_0 = const()[name = tensor("input_249_mode_0"), val = tensor("EXACT")]; tensor input_249_cast_fp16 = gelu(mode = input_249_mode_0, x = input_247_cast_fp16)[name = tensor("input_249_cast_fp16")]; tensor var_5511 = const()[name = tensor("op_5511"), val = tensor([1, 1])]; tensor var_5513 = const()[name = tensor("op_5513"), val = tensor([1, 1])]; tensor hidden_states_51_pad_type_0 = const()[name = tensor("hidden_states_51_pad_type_0"), val = tensor("custom")]; tensor hidden_states_51_pad_0 = const()[name = tensor("hidden_states_51_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_24_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(671922880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(676838144))), name = tensor("layers_24_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_24_fc2_bias_to_fp16 = const()[name = tensor("layers_24_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(676838336)))]; tensor hidden_states_51_cast_fp16 = conv(bias = layers_24_fc2_bias_to_fp16, dilations = var_5513, groups = var_5319, pad = hidden_states_51_pad_0, pad_type = hidden_states_51_pad_type_0, strides = var_5511, weight = layers_24_fc2_weight_to_fp16_palettized, x = input_249_cast_fp16)[name = tensor("hidden_states_51_cast_fp16")]; tensor inputs_151_cast_fp16 = add(x = inputs_149_cast_fp16, y = hidden_states_51_cast_fp16)[name = tensor("inputs_151_cast_fp16")]; tensor var_5526 = const()[name = tensor("op_5526"), val = tensor(3)]; tensor var_5533 = const()[name = tensor("op_5533"), val = tensor(1)]; tensor var_5534 = const()[name = tensor("op_5534"), val = tensor(true)]; tensor var_5546 = const()[name = tensor("op_5546"), val = tensor([1])]; tensor channels_mean_151_cast_fp16 = reduce_mean(axes = var_5546, keep_dims = var_5534, x = inputs_151_cast_fp16)[name = tensor("channels_mean_151_cast_fp16")]; tensor zero_mean_151_cast_fp16 = sub(x = inputs_151_cast_fp16, y = channels_mean_151_cast_fp16)[name = tensor("zero_mean_151_cast_fp16")]; tensor zero_mean_sq_151_cast_fp16 = mul(x = zero_mean_151_cast_fp16, y = zero_mean_151_cast_fp16)[name = tensor("zero_mean_sq_151_cast_fp16")]; tensor var_5550 = const()[name = tensor("op_5550"), val = tensor([1])]; tensor var_5551_cast_fp16 = reduce_mean(axes = var_5550, keep_dims = var_5534, x = zero_mean_sq_151_cast_fp16)[name = tensor("op_5551_cast_fp16")]; tensor var_5552_to_fp16 = const()[name = tensor("op_5552_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5553_cast_fp16 = add(x = var_5551_cast_fp16, y = var_5552_to_fp16)[name = tensor("op_5553_cast_fp16")]; tensor denom_151_epsilon_0 = const()[name = tensor("denom_151_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_151_cast_fp16 = rsqrt(epsilon = denom_151_epsilon_0, x = var_5553_cast_fp16)[name = tensor("denom_151_cast_fp16")]; tensor out_151_cast_fp16 = mul(x = zero_mean_151_cast_fp16, y = denom_151_cast_fp16)[name = tensor("out_151_cast_fp16")]; tensor obj_301_gamma_0_to_fp16 = const()[name = tensor("obj_301_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(676840960)))]; tensor obj_301_beta_0_to_fp16 = const()[name = tensor("obj_301_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(676843584)))]; tensor obj_301_epsilon_0_to_fp16 = const()[name = tensor("obj_301_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_301_cast_fp16 = batch_norm(beta = obj_301_beta_0_to_fp16, epsilon = obj_301_epsilon_0_to_fp16, gamma = obj_301_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_151_cast_fp16)[name = tensor("obj_301_cast_fp16")]; tensor var_5568 = const()[name = tensor("op_5568"), val = tensor([1, 1])]; tensor var_5570 = const()[name = tensor("op_5570"), val = tensor([1, 1])]; tensor query_101_pad_type_0 = const()[name = tensor("query_101_pad_type_0"), val = tensor("custom")]; tensor query_101_pad_0 = const()[name = tensor("query_101_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(676846208))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(677665472))), name = tensor("layers_25_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_25_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_25_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(677665600)))]; tensor query_101_cast_fp16 = conv(bias = layers_25_self_attn_q_proj_bias_to_fp16, dilations = var_5570, groups = var_5533, pad = query_101_pad_0, pad_type = query_101_pad_type_0, strides = var_5568, weight = layers_25_self_attn_q_proj_weight_to_fp16_palettized, x = obj_301_cast_fp16)[name = tensor("query_101_cast_fp16")]; tensor var_5574 = const()[name = tensor("op_5574"), val = tensor([1, 1])]; tensor var_5576 = const()[name = tensor("op_5576"), val = tensor([1, 1])]; tensor current_key_51_pad_type_0 = const()[name = tensor("current_key_51_pad_type_0"), val = tensor("custom")]; tensor current_key_51_pad_0 = const()[name = tensor("current_key_51_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(677668224))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(678897088))), name = tensor("layers_25_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_51_cast_fp16 = conv(dilations = var_5576, groups = var_5533, pad = current_key_51_pad_0, pad_type = current_key_51_pad_type_0, strides = var_5574, weight = layers_25_self_attn_k_proj_weight_to_fp16_palettized, x = obj_301_cast_fp16)[name = tensor("current_key_51_cast_fp16")]; tensor var_5581 = const()[name = tensor("op_5581"), val = tensor([1, 1])]; tensor var_5583 = const()[name = tensor("op_5583"), val = tensor([1, 1])]; tensor current_value_51_pad_type_0 = const()[name = tensor("current_value_51_pad_type_0"), val = tensor("custom")]; tensor current_value_51_pad_0 = const()[name = tensor("current_value_51_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(678897280))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(679716544))), name = tensor("layers_25_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_25_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_25_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(679716672)))]; tensor current_value_51_cast_fp16 = conv(bias = layers_25_self_attn_v_proj_bias_to_fp16, dilations = var_5583, groups = var_5533, pad = current_value_51_pad_0, pad_type = current_value_51_pad_type_0, strides = var_5581, weight = layers_25_self_attn_v_proj_weight_to_fp16_palettized, x = obj_301_cast_fp16)[name = tensor("current_value_51_cast_fp16")]; tensor var_5590_cast_fp16 = mul(x = current_key_51_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_5590_cast_fp16")]; tensor var_5592_cast_fp16 = mul(x = var_103_cast_fp16_25, y = var_241_cast_fp16)[name = tensor("op_5592_cast_fp16")]; tensor key_101_cast_fp16 = add(x = var_5590_cast_fp16, y = var_5592_cast_fp16)[name = tensor("key_101_cast_fp16")]; tensor var_5594_cast_fp16 = mul(x = current_value_51_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_5594_cast_fp16")]; tensor var_5596_cast_fp16 = mul(x = var_138_cast_fp16_25, y = var_241_cast_fp16)[name = tensor("op_5596_cast_fp16")]; tensor value_101_cast_fp16 = add(x = var_5594_cast_fp16, y = var_5596_cast_fp16)[name = tensor("value_101_cast_fp16")]; tensor var_5599 = const()[name = tensor("op_5599"), val = tensor([1, 20, 64, -1])]; tensor var_5600_cast_fp16 = reshape(shape = var_5599, x = query_101_cast_fp16)[name = tensor("op_5600_cast_fp16")]; tensor var_5601_to_fp16 = const()[name = tensor("op_5601_to_fp16"), val = tensor(0x1p-3)]; tensor var_5602_cast_fp16 = mul(x = var_5600_cast_fp16, y = var_5601_to_fp16)[name = tensor("op_5602_cast_fp16")]; tensor var_5603 = const()[name = tensor("op_5603"), val = tensor([1, 20, 64, -1])]; tensor var_5604_cast_fp16 = reshape(shape = var_5603, x = key_101_cast_fp16)[name = tensor("op_5604_cast_fp16")]; tensor mh_w_151_transpose_x_0 = const()[name = tensor("mh_w_151_transpose_x_0"), val = tensor(true)]; tensor mh_w_151_transpose_y_0 = const()[name = tensor("mh_w_151_transpose_y_0"), val = tensor(false)]; tensor mh_w_151_cast_fp16 = matmul(transpose_x = mh_w_151_transpose_x_0, transpose_y = mh_w_151_transpose_y_0, x = var_5602_cast_fp16, y = var_5604_cast_fp16)[name = tensor("mh_w_151_cast_fp16")]; tensor mh_w_153_cast_fp16 = add(x = mh_w_151_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_153_cast_fp16")]; tensor var_5612_cast_fp16 = softmax(axis = var_5526, x = mh_w_153_cast_fp16)[name = tensor("op_5612_cast_fp16")]; tensor var_5613 = const()[name = tensor("op_5613"), val = tensor([1, 20, 64, -1])]; tensor var_5614_cast_fp16 = reshape(shape = var_5613, x = value_101_cast_fp16)[name = tensor("op_5614_cast_fp16")]; tensor attn_101_transpose_x_0 = const()[name = tensor("attn_101_transpose_x_0"), val = tensor(false)]; tensor attn_101_transpose_y_0 = const()[name = tensor("attn_101_transpose_y_0"), val = tensor(true)]; tensor attn_101_cast_fp16 = matmul(transpose_x = attn_101_transpose_x_0, transpose_y = attn_101_transpose_y_0, x = var_5614_cast_fp16, y = var_5612_cast_fp16)[name = tensor("attn_101_cast_fp16")]; tensor var_5617 = const()[name = tensor("op_5617"), val = tensor([1, 1280, 1, -1])]; tensor input_251_cast_fp16 = reshape(shape = var_5617, x = attn_101_cast_fp16)[name = tensor("input_251_cast_fp16")]; tensor var_5621 = const()[name = tensor("op_5621"), val = tensor([1, 1])]; tensor var_5623 = const()[name = tensor("op_5623"), val = tensor([1, 1])]; tensor obj_307_pad_type_0 = const()[name = tensor("obj_307_pad_type_0"), val = tensor("custom")]; tensor obj_307_pad_0 = const()[name = tensor("obj_307_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(679719296))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(680948160))), name = tensor("layers_25_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_25_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_25_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(680948352)))]; tensor obj_307_cast_fp16 = conv(bias = layers_25_self_attn_o_proj_bias_to_fp16, dilations = var_5623, groups = var_5533, pad = obj_307_pad_0, pad_type = obj_307_pad_type_0, strides = var_5621, weight = layers_25_self_attn_o_proj_weight_to_fp16_palettized, x = input_251_cast_fp16)[name = tensor("obj_307_cast_fp16")]; tensor inputs_153_cast_fp16 = add(x = inputs_151_cast_fp16, y = obj_307_cast_fp16)[name = tensor("inputs_153_cast_fp16")]; tensor var_5633 = const()[name = tensor("op_5633"), val = tensor([1])]; tensor channels_mean_153_cast_fp16 = reduce_mean(axes = var_5633, keep_dims = var_5534, x = inputs_153_cast_fp16)[name = tensor("channels_mean_153_cast_fp16")]; tensor zero_mean_153_cast_fp16 = sub(x = inputs_153_cast_fp16, y = channels_mean_153_cast_fp16)[name = tensor("zero_mean_153_cast_fp16")]; tensor zero_mean_sq_153_cast_fp16 = mul(x = zero_mean_153_cast_fp16, y = zero_mean_153_cast_fp16)[name = tensor("zero_mean_sq_153_cast_fp16")]; tensor var_5637 = const()[name = tensor("op_5637"), val = tensor([1])]; tensor var_5638_cast_fp16 = reduce_mean(axes = var_5637, keep_dims = var_5534, x = zero_mean_sq_153_cast_fp16)[name = tensor("op_5638_cast_fp16")]; tensor var_5639_to_fp16 = const()[name = tensor("op_5639_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5640_cast_fp16 = add(x = var_5638_cast_fp16, y = var_5639_to_fp16)[name = tensor("op_5640_cast_fp16")]; tensor denom_153_epsilon_0 = const()[name = tensor("denom_153_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_153_cast_fp16 = rsqrt(epsilon = denom_153_epsilon_0, x = var_5640_cast_fp16)[name = tensor("denom_153_cast_fp16")]; tensor out_153_cast_fp16 = mul(x = zero_mean_153_cast_fp16, y = denom_153_cast_fp16)[name = tensor("out_153_cast_fp16")]; tensor obj_309_gamma_0_to_fp16 = const()[name = tensor("obj_309_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(680950976)))]; tensor obj_309_beta_0_to_fp16 = const()[name = tensor("obj_309_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(680953600)))]; tensor obj_309_epsilon_0_to_fp16 = const()[name = tensor("obj_309_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_309_cast_fp16 = batch_norm(beta = obj_309_beta_0_to_fp16, epsilon = obj_309_epsilon_0_to_fp16, gamma = obj_309_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_153_cast_fp16)[name = tensor("obj_309_cast_fp16")]; tensor var_5655 = const()[name = tensor("op_5655"), val = tensor([1, 1])]; tensor var_5657 = const()[name = tensor("op_5657"), val = tensor([1, 1])]; tensor query_103_pad_type_0 = const()[name = tensor("query_103_pad_type_0"), val = tensor("custom")]; tensor query_103_pad_0 = const()[name = tensor("query_103_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(680956224))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(682185088))), name = tensor("layers_25_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_25_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_25_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(682185280)))]; tensor query_103_cast_fp16 = conv(bias = layers_25_encoder_attn_q_proj_bias_to_fp16, dilations = var_5657, groups = var_5533, pad = query_103_pad_0, pad_type = query_103_pad_type_0, strides = var_5655, weight = layers_25_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_309_cast_fp16)[name = tensor("query_103_cast_fp16")]; tensor var_5661 = const()[name = tensor("op_5661"), val = tensor([1, 1])]; tensor var_5663 = const()[name = tensor("op_5663"), val = tensor([1, 1])]; tensor key_103_pad_type_0 = const()[name = tensor("key_103_pad_type_0"), val = tensor("custom")]; tensor key_103_pad_0 = const()[name = tensor("key_103_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(682187904))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683007168))), name = tensor("layers_25_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_103_cast_fp16 = conv(dilations = var_5663, groups = var_5533, pad = key_103_pad_0, pad_type = key_103_pad_type_0, strides = var_5661, weight = layers_25_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_103_cast_fp16")]; tensor var_5668 = const()[name = tensor("op_5668"), val = tensor([1, 1])]; tensor var_5670 = const()[name = tensor("op_5670"), val = tensor([1, 1])]; tensor value_103_pad_type_0 = const()[name = tensor("value_103_pad_type_0"), val = tensor("custom")]; tensor value_103_pad_0 = const()[name = tensor("value_103_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(683007296))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(684236160))), name = tensor("layers_25_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_25_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_25_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(684236352)))]; tensor value_103_cast_fp16 = conv(bias = layers_25_encoder_attn_v_proj_bias_to_fp16, dilations = var_5670, groups = var_5533, pad = value_103_pad_0, pad_type = value_103_pad_type_0, strides = var_5668, weight = layers_25_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_103_cast_fp16")]; tensor var_5674 = const()[name = tensor("op_5674"), val = tensor([1, 20, 64, -1])]; tensor var_5675_cast_fp16 = reshape(shape = var_5674, x = query_103_cast_fp16)[name = tensor("op_5675_cast_fp16")]; tensor var_5676_to_fp16 = const()[name = tensor("op_5676_to_fp16"), val = tensor(0x1p-3)]; tensor var_5677_cast_fp16 = mul(x = var_5675_cast_fp16, y = var_5676_to_fp16)[name = tensor("op_5677_cast_fp16")]; tensor var_5678 = const()[name = tensor("op_5678"), val = tensor([1, 20, 64, -1])]; tensor var_5679_cast_fp16 = reshape(shape = var_5678, x = key_103_cast_fp16)[name = tensor("op_5679_cast_fp16")]; tensor mh_w_155_transpose_x_0 = const()[name = tensor("mh_w_155_transpose_x_0"), val = tensor(true)]; tensor mh_w_155_transpose_y_0 = const()[name = tensor("mh_w_155_transpose_y_0"), val = tensor(false)]; tensor mh_w_155_cast_fp16 = matmul(transpose_x = mh_w_155_transpose_x_0, transpose_y = mh_w_155_transpose_y_0, x = var_5677_cast_fp16, y = var_5679_cast_fp16)[name = tensor("mh_w_155_cast_fp16")]; tensor var_5682_cast_fp16 = softmax(axis = var_5526, x = mh_w_155_cast_fp16)[name = tensor("op_5682_cast_fp16")]; tensor var_5683 = const()[name = tensor("op_5683"), val = tensor([1, 20, 64, -1])]; tensor var_5684_cast_fp16 = reshape(shape = var_5683, x = value_103_cast_fp16)[name = tensor("op_5684_cast_fp16")]; tensor attn_103_transpose_x_0 = const()[name = tensor("attn_103_transpose_x_0"), val = tensor(false)]; tensor attn_103_transpose_y_0 = const()[name = tensor("attn_103_transpose_y_0"), val = tensor(true)]; tensor attn_103_cast_fp16 = matmul(transpose_x = attn_103_transpose_x_0, transpose_y = attn_103_transpose_y_0, x = var_5684_cast_fp16, y = var_5682_cast_fp16)[name = tensor("attn_103_cast_fp16")]; tensor var_5687 = const()[name = tensor("op_5687"), val = tensor([1, 1280, 1, -1])]; tensor input_253_cast_fp16 = reshape(shape = var_5687, x = attn_103_cast_fp16)[name = tensor("input_253_cast_fp16")]; tensor var_5691 = const()[name = tensor("op_5691"), val = tensor([1, 1])]; tensor var_5693 = const()[name = tensor("op_5693"), val = tensor([1, 1])]; tensor obj_311_pad_type_0 = const()[name = tensor("obj_311_pad_type_0"), val = tensor("custom")]; tensor obj_311_pad_0 = const()[name = tensor("obj_311_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(684238976))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(685467840))), name = tensor("layers_25_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_25_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_25_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(685468032)))]; tensor obj_311_cast_fp16 = conv(bias = layers_25_encoder_attn_o_proj_bias_to_fp16, dilations = var_5693, groups = var_5533, pad = obj_311_pad_0, pad_type = obj_311_pad_type_0, strides = var_5691, weight = layers_25_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_253_cast_fp16)[name = tensor("obj_311_cast_fp16")]; tensor inputs_155_cast_fp16 = add(x = inputs_153_cast_fp16, y = obj_311_cast_fp16)[name = tensor("inputs_155_cast_fp16")]; tensor var_5699 = const()[name = tensor("op_5699"), val = tensor([1])]; tensor channels_mean_155_cast_fp16 = reduce_mean(axes = var_5699, keep_dims = var_5534, x = inputs_155_cast_fp16)[name = tensor("channels_mean_155_cast_fp16")]; tensor zero_mean_155_cast_fp16 = sub(x = inputs_155_cast_fp16, y = channels_mean_155_cast_fp16)[name = tensor("zero_mean_155_cast_fp16")]; tensor zero_mean_sq_155_cast_fp16 = mul(x = zero_mean_155_cast_fp16, y = zero_mean_155_cast_fp16)[name = tensor("zero_mean_sq_155_cast_fp16")]; tensor var_5703 = const()[name = tensor("op_5703"), val = tensor([1])]; tensor var_5704_cast_fp16 = reduce_mean(axes = var_5703, keep_dims = var_5534, x = zero_mean_sq_155_cast_fp16)[name = tensor("op_5704_cast_fp16")]; tensor var_5705_to_fp16 = const()[name = tensor("op_5705_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5706_cast_fp16 = add(x = var_5704_cast_fp16, y = var_5705_to_fp16)[name = tensor("op_5706_cast_fp16")]; tensor denom_155_epsilon_0 = const()[name = tensor("denom_155_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_155_cast_fp16 = rsqrt(epsilon = denom_155_epsilon_0, x = var_5706_cast_fp16)[name = tensor("denom_155_cast_fp16")]; tensor out_155_cast_fp16 = mul(x = zero_mean_155_cast_fp16, y = denom_155_cast_fp16)[name = tensor("out_155_cast_fp16")]; tensor input_255_gamma_0_to_fp16 = const()[name = tensor("input_255_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(685470656)))]; tensor input_255_beta_0_to_fp16 = const()[name = tensor("input_255_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(685473280)))]; tensor input_255_epsilon_0_to_fp16 = const()[name = tensor("input_255_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_255_cast_fp16 = batch_norm(beta = input_255_beta_0_to_fp16, epsilon = input_255_epsilon_0_to_fp16, gamma = input_255_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_155_cast_fp16)[name = tensor("input_255_cast_fp16")]; tensor var_5717 = const()[name = tensor("op_5717"), val = tensor([1, 1])]; tensor var_5719 = const()[name = tensor("op_5719"), val = tensor([1, 1])]; tensor input_257_pad_type_0 = const()[name = tensor("input_257_pad_type_0"), val = tensor("custom")]; tensor input_257_pad_0 = const()[name = tensor("input_257_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(685475904))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(688752768))), name = tensor("layers_25_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_25_fc1_bias_to_fp16 = const()[name = tensor("layers_25_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(688752896)))]; tensor input_257_cast_fp16 = conv(bias = layers_25_fc1_bias_to_fp16, dilations = var_5719, groups = var_5533, pad = input_257_pad_0, pad_type = input_257_pad_type_0, strides = var_5717, weight = layers_25_fc1_weight_to_fp16_palettized, x = input_255_cast_fp16)[name = tensor("input_257_cast_fp16")]; tensor input_259_mode_0 = const()[name = tensor("input_259_mode_0"), val = tensor("EXACT")]; tensor input_259_cast_fp16 = gelu(mode = input_259_mode_0, x = input_257_cast_fp16)[name = tensor("input_259_cast_fp16")]; tensor var_5725 = const()[name = tensor("op_5725"), val = tensor([1, 1])]; tensor var_5727 = const()[name = tensor("op_5727"), val = tensor([1, 1])]; tensor hidden_states_53_pad_type_0 = const()[name = tensor("hidden_states_53_pad_type_0"), val = tensor("custom")]; tensor hidden_states_53_pad_0 = const()[name = tensor("hidden_states_53_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_25_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(688763200))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(693678464))), name = tensor("layers_25_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_25_fc2_bias_to_fp16 = const()[name = tensor("layers_25_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(693678656)))]; tensor hidden_states_53_cast_fp16 = conv(bias = layers_25_fc2_bias_to_fp16, dilations = var_5727, groups = var_5533, pad = hidden_states_53_pad_0, pad_type = hidden_states_53_pad_type_0, strides = var_5725, weight = layers_25_fc2_weight_to_fp16_palettized, x = input_259_cast_fp16)[name = tensor("hidden_states_53_cast_fp16")]; tensor inputs_157_cast_fp16 = add(x = inputs_155_cast_fp16, y = hidden_states_53_cast_fp16)[name = tensor("inputs_157_cast_fp16")]; tensor var_5740 = const()[name = tensor("op_5740"), val = tensor(3)]; tensor var_5747 = const()[name = tensor("op_5747"), val = tensor(1)]; tensor var_5748 = const()[name = tensor("op_5748"), val = tensor(true)]; tensor var_5760 = const()[name = tensor("op_5760"), val = tensor([1])]; tensor channels_mean_157_cast_fp16 = reduce_mean(axes = var_5760, keep_dims = var_5748, x = inputs_157_cast_fp16)[name = tensor("channels_mean_157_cast_fp16")]; tensor zero_mean_157_cast_fp16 = sub(x = inputs_157_cast_fp16, y = channels_mean_157_cast_fp16)[name = tensor("zero_mean_157_cast_fp16")]; tensor zero_mean_sq_157_cast_fp16 = mul(x = zero_mean_157_cast_fp16, y = zero_mean_157_cast_fp16)[name = tensor("zero_mean_sq_157_cast_fp16")]; tensor var_5764 = const()[name = tensor("op_5764"), val = tensor([1])]; tensor var_5765_cast_fp16 = reduce_mean(axes = var_5764, keep_dims = var_5748, x = zero_mean_sq_157_cast_fp16)[name = tensor("op_5765_cast_fp16")]; tensor var_5766_to_fp16 = const()[name = tensor("op_5766_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5767_cast_fp16 = add(x = var_5765_cast_fp16, y = var_5766_to_fp16)[name = tensor("op_5767_cast_fp16")]; tensor denom_157_epsilon_0 = const()[name = tensor("denom_157_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_157_cast_fp16 = rsqrt(epsilon = denom_157_epsilon_0, x = var_5767_cast_fp16)[name = tensor("denom_157_cast_fp16")]; tensor out_157_cast_fp16 = mul(x = zero_mean_157_cast_fp16, y = denom_157_cast_fp16)[name = tensor("out_157_cast_fp16")]; tensor obj_313_gamma_0_to_fp16 = const()[name = tensor("obj_313_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(693681280)))]; tensor obj_313_beta_0_to_fp16 = const()[name = tensor("obj_313_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(693683904)))]; tensor obj_313_epsilon_0_to_fp16 = const()[name = tensor("obj_313_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_313_cast_fp16 = batch_norm(beta = obj_313_beta_0_to_fp16, epsilon = obj_313_epsilon_0_to_fp16, gamma = obj_313_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_157_cast_fp16)[name = tensor("obj_313_cast_fp16")]; tensor var_5782 = const()[name = tensor("op_5782"), val = tensor([1, 1])]; tensor var_5784 = const()[name = tensor("op_5784"), val = tensor([1, 1])]; tensor query_105_pad_type_0 = const()[name = tensor("query_105_pad_type_0"), val = tensor("custom")]; tensor query_105_pad_0 = const()[name = tensor("query_105_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(693686528))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(694505792))), name = tensor("layers_26_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_26_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_26_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(694505920)))]; tensor query_105_cast_fp16 = conv(bias = layers_26_self_attn_q_proj_bias_to_fp16, dilations = var_5784, groups = var_5747, pad = query_105_pad_0, pad_type = query_105_pad_type_0, strides = var_5782, weight = layers_26_self_attn_q_proj_weight_to_fp16_palettized, x = obj_313_cast_fp16)[name = tensor("query_105_cast_fp16")]; tensor var_5788 = const()[name = tensor("op_5788"), val = tensor([1, 1])]; tensor var_5790 = const()[name = tensor("op_5790"), val = tensor([1, 1])]; tensor current_key_53_pad_type_0 = const()[name = tensor("current_key_53_pad_type_0"), val = tensor("custom")]; tensor current_key_53_pad_0 = const()[name = tensor("current_key_53_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(694508544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696147008))), name = tensor("layers_26_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_53_cast_fp16 = conv(dilations = var_5790, groups = var_5747, pad = current_key_53_pad_0, pad_type = current_key_53_pad_type_0, strides = var_5788, weight = layers_26_self_attn_k_proj_weight_to_fp16_palettized, x = obj_313_cast_fp16)[name = tensor("current_key_53_cast_fp16")]; tensor var_5795 = const()[name = tensor("op_5795"), val = tensor([1, 1])]; tensor var_5797 = const()[name = tensor("op_5797"), val = tensor([1, 1])]; tensor current_value_53_pad_type_0 = const()[name = tensor("current_value_53_pad_type_0"), val = tensor("custom")]; tensor current_value_53_pad_0 = const()[name = tensor("current_value_53_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696147584))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696966848))), name = tensor("layers_26_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_26_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_26_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696966976)))]; tensor current_value_53_cast_fp16 = conv(bias = layers_26_self_attn_v_proj_bias_to_fp16, dilations = var_5797, groups = var_5747, pad = current_value_53_pad_0, pad_type = current_value_53_pad_type_0, strides = var_5795, weight = layers_26_self_attn_v_proj_weight_to_fp16_palettized, x = obj_313_cast_fp16)[name = tensor("current_value_53_cast_fp16")]; tensor var_5804_cast_fp16 = mul(x = current_key_53_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_5804_cast_fp16")]; tensor var_5806_cast_fp16 = mul(x = var_103_cast_fp16_26, y = var_241_cast_fp16)[name = tensor("op_5806_cast_fp16")]; tensor key_105_cast_fp16 = add(x = var_5804_cast_fp16, y = var_5806_cast_fp16)[name = tensor("key_105_cast_fp16")]; tensor var_5808_cast_fp16 = mul(x = current_value_53_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_5808_cast_fp16")]; tensor var_5810_cast_fp16 = mul(x = var_138_cast_fp16_26, y = var_241_cast_fp16)[name = tensor("op_5810_cast_fp16")]; tensor value_105_cast_fp16 = add(x = var_5808_cast_fp16, y = var_5810_cast_fp16)[name = tensor("value_105_cast_fp16")]; tensor var_5813 = const()[name = tensor("op_5813"), val = tensor([1, 20, 64, -1])]; tensor var_5814_cast_fp16 = reshape(shape = var_5813, x = query_105_cast_fp16)[name = tensor("op_5814_cast_fp16")]; tensor var_5815_to_fp16 = const()[name = tensor("op_5815_to_fp16"), val = tensor(0x1p-3)]; tensor var_5816_cast_fp16 = mul(x = var_5814_cast_fp16, y = var_5815_to_fp16)[name = tensor("op_5816_cast_fp16")]; tensor var_5817 = const()[name = tensor("op_5817"), val = tensor([1, 20, 64, -1])]; tensor var_5818_cast_fp16 = reshape(shape = var_5817, x = key_105_cast_fp16)[name = tensor("op_5818_cast_fp16")]; tensor mh_w_157_transpose_x_0 = const()[name = tensor("mh_w_157_transpose_x_0"), val = tensor(true)]; tensor mh_w_157_transpose_y_0 = const()[name = tensor("mh_w_157_transpose_y_0"), val = tensor(false)]; tensor mh_w_157_cast_fp16 = matmul(transpose_x = mh_w_157_transpose_x_0, transpose_y = mh_w_157_transpose_y_0, x = var_5816_cast_fp16, y = var_5818_cast_fp16)[name = tensor("mh_w_157_cast_fp16")]; tensor mh_w_159_cast_fp16 = add(x = mh_w_157_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_159_cast_fp16")]; tensor var_5826_cast_fp16 = softmax(axis = var_5740, x = mh_w_159_cast_fp16)[name = tensor("op_5826_cast_fp16")]; tensor var_5827 = const()[name = tensor("op_5827"), val = tensor([1, 20, 64, -1])]; tensor var_5828_cast_fp16 = reshape(shape = var_5827, x = value_105_cast_fp16)[name = tensor("op_5828_cast_fp16")]; tensor attn_105_transpose_x_0 = const()[name = tensor("attn_105_transpose_x_0"), val = tensor(false)]; tensor attn_105_transpose_y_0 = const()[name = tensor("attn_105_transpose_y_0"), val = tensor(true)]; tensor attn_105_cast_fp16 = matmul(transpose_x = attn_105_transpose_x_0, transpose_y = attn_105_transpose_y_0, x = var_5828_cast_fp16, y = var_5826_cast_fp16)[name = tensor("attn_105_cast_fp16")]; tensor var_5831 = const()[name = tensor("op_5831"), val = tensor([1, 1280, 1, -1])]; tensor input_261_cast_fp16 = reshape(shape = var_5831, x = attn_105_cast_fp16)[name = tensor("input_261_cast_fp16")]; tensor var_5835 = const()[name = tensor("op_5835"), val = tensor([1, 1])]; tensor var_5837 = const()[name = tensor("op_5837"), val = tensor([1, 1])]; tensor obj_319_pad_type_0 = const()[name = tensor("obj_319_pad_type_0"), val = tensor("custom")]; tensor obj_319_pad_0 = const()[name = tensor("obj_319_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(696969600))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(697788864))), name = tensor("layers_26_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_26_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_26_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(697788992)))]; tensor obj_319_cast_fp16 = conv(bias = layers_26_self_attn_o_proj_bias_to_fp16, dilations = var_5837, groups = var_5747, pad = obj_319_pad_0, pad_type = obj_319_pad_type_0, strides = var_5835, weight = layers_26_self_attn_o_proj_weight_to_fp16_palettized, x = input_261_cast_fp16)[name = tensor("obj_319_cast_fp16")]; tensor inputs_159_cast_fp16 = add(x = inputs_157_cast_fp16, y = obj_319_cast_fp16)[name = tensor("inputs_159_cast_fp16")]; tensor var_5847 = const()[name = tensor("op_5847"), val = tensor([1])]; tensor channels_mean_159_cast_fp16 = reduce_mean(axes = var_5847, keep_dims = var_5748, x = inputs_159_cast_fp16)[name = tensor("channels_mean_159_cast_fp16")]; tensor zero_mean_159_cast_fp16 = sub(x = inputs_159_cast_fp16, y = channels_mean_159_cast_fp16)[name = tensor("zero_mean_159_cast_fp16")]; tensor zero_mean_sq_159_cast_fp16 = mul(x = zero_mean_159_cast_fp16, y = zero_mean_159_cast_fp16)[name = tensor("zero_mean_sq_159_cast_fp16")]; tensor var_5851 = const()[name = tensor("op_5851"), val = tensor([1])]; tensor var_5852_cast_fp16 = reduce_mean(axes = var_5851, keep_dims = var_5748, x = zero_mean_sq_159_cast_fp16)[name = tensor("op_5852_cast_fp16")]; tensor var_5853_to_fp16 = const()[name = tensor("op_5853_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5854_cast_fp16 = add(x = var_5852_cast_fp16, y = var_5853_to_fp16)[name = tensor("op_5854_cast_fp16")]; tensor denom_159_epsilon_0 = const()[name = tensor("denom_159_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_159_cast_fp16 = rsqrt(epsilon = denom_159_epsilon_0, x = var_5854_cast_fp16)[name = tensor("denom_159_cast_fp16")]; tensor out_159_cast_fp16 = mul(x = zero_mean_159_cast_fp16, y = denom_159_cast_fp16)[name = tensor("out_159_cast_fp16")]; tensor obj_321_gamma_0_to_fp16 = const()[name = tensor("obj_321_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(697791616)))]; tensor obj_321_beta_0_to_fp16 = const()[name = tensor("obj_321_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(697794240)))]; tensor obj_321_epsilon_0_to_fp16 = const()[name = tensor("obj_321_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_321_cast_fp16 = batch_norm(beta = obj_321_beta_0_to_fp16, epsilon = obj_321_epsilon_0_to_fp16, gamma = obj_321_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_159_cast_fp16)[name = tensor("obj_321_cast_fp16")]; tensor var_5869 = const()[name = tensor("op_5869"), val = tensor([1, 1])]; tensor var_5871 = const()[name = tensor("op_5871"), val = tensor([1, 1])]; tensor query_107_pad_type_0 = const()[name = tensor("query_107_pad_type_0"), val = tensor("custom")]; tensor query_107_pad_0 = const()[name = tensor("query_107_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(697796864))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(699025728))), name = tensor("layers_26_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_26_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_26_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(699025920)))]; tensor query_107_cast_fp16 = conv(bias = layers_26_encoder_attn_q_proj_bias_to_fp16, dilations = var_5871, groups = var_5747, pad = query_107_pad_0, pad_type = query_107_pad_type_0, strides = var_5869, weight = layers_26_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_321_cast_fp16)[name = tensor("query_107_cast_fp16")]; tensor var_5875 = const()[name = tensor("op_5875"), val = tensor([1, 1])]; tensor var_5877 = const()[name = tensor("op_5877"), val = tensor([1, 1])]; tensor key_107_pad_type_0 = const()[name = tensor("key_107_pad_type_0"), val = tensor("custom")]; tensor key_107_pad_0 = const()[name = tensor("key_107_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(699028544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(699847808))), name = tensor("layers_26_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_107_cast_fp16 = conv(dilations = var_5877, groups = var_5747, pad = key_107_pad_0, pad_type = key_107_pad_type_0, strides = var_5875, weight = layers_26_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_107_cast_fp16")]; tensor var_5882 = const()[name = tensor("op_5882"), val = tensor([1, 1])]; tensor var_5884 = const()[name = tensor("op_5884"), val = tensor([1, 1])]; tensor value_107_pad_type_0 = const()[name = tensor("value_107_pad_type_0"), val = tensor("custom")]; tensor value_107_pad_0 = const()[name = tensor("value_107_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(699847936))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(701076800))), name = tensor("layers_26_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_26_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_26_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(701076992)))]; tensor value_107_cast_fp16 = conv(bias = layers_26_encoder_attn_v_proj_bias_to_fp16, dilations = var_5884, groups = var_5747, pad = value_107_pad_0, pad_type = value_107_pad_type_0, strides = var_5882, weight = layers_26_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_107_cast_fp16")]; tensor var_5888 = const()[name = tensor("op_5888"), val = tensor([1, 20, 64, -1])]; tensor var_5889_cast_fp16 = reshape(shape = var_5888, x = query_107_cast_fp16)[name = tensor("op_5889_cast_fp16")]; tensor var_5890_to_fp16 = const()[name = tensor("op_5890_to_fp16"), val = tensor(0x1p-3)]; tensor var_5891_cast_fp16 = mul(x = var_5889_cast_fp16, y = var_5890_to_fp16)[name = tensor("op_5891_cast_fp16")]; tensor var_5892 = const()[name = tensor("op_5892"), val = tensor([1, 20, 64, -1])]; tensor var_5893_cast_fp16 = reshape(shape = var_5892, x = key_107_cast_fp16)[name = tensor("op_5893_cast_fp16")]; tensor mh_w_161_transpose_x_0 = const()[name = tensor("mh_w_161_transpose_x_0"), val = tensor(true)]; tensor mh_w_161_transpose_y_0 = const()[name = tensor("mh_w_161_transpose_y_0"), val = tensor(false)]; tensor mh_w_161_cast_fp16 = matmul(transpose_x = mh_w_161_transpose_x_0, transpose_y = mh_w_161_transpose_y_0, x = var_5891_cast_fp16, y = var_5893_cast_fp16)[name = tensor("mh_w_161_cast_fp16")]; tensor var_5896_cast_fp16 = softmax(axis = var_5740, x = mh_w_161_cast_fp16)[name = tensor("op_5896_cast_fp16")]; tensor var_5897 = const()[name = tensor("op_5897"), val = tensor([1, 20, 64, -1])]; tensor var_5898_cast_fp16 = reshape(shape = var_5897, x = value_107_cast_fp16)[name = tensor("op_5898_cast_fp16")]; tensor attn_107_transpose_x_0 = const()[name = tensor("attn_107_transpose_x_0"), val = tensor(false)]; tensor attn_107_transpose_y_0 = const()[name = tensor("attn_107_transpose_y_0"), val = tensor(true)]; tensor attn_107_cast_fp16 = matmul(transpose_x = attn_107_transpose_x_0, transpose_y = attn_107_transpose_y_0, x = var_5898_cast_fp16, y = var_5896_cast_fp16)[name = tensor("attn_107_cast_fp16")]; tensor var_5901 = const()[name = tensor("op_5901"), val = tensor([1, 1280, 1, -1])]; tensor input_263_cast_fp16 = reshape(shape = var_5901, x = attn_107_cast_fp16)[name = tensor("input_263_cast_fp16")]; tensor var_5905 = const()[name = tensor("op_5905"), val = tensor([1, 1])]; tensor var_5907 = const()[name = tensor("op_5907"), val = tensor([1, 1])]; tensor obj_323_pad_type_0 = const()[name = tensor("obj_323_pad_type_0"), val = tensor("custom")]; tensor obj_323_pad_0 = const()[name = tensor("obj_323_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(701079616))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(702308480))), name = tensor("layers_26_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_26_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_26_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(702308672)))]; tensor obj_323_cast_fp16 = conv(bias = layers_26_encoder_attn_o_proj_bias_to_fp16, dilations = var_5907, groups = var_5747, pad = obj_323_pad_0, pad_type = obj_323_pad_type_0, strides = var_5905, weight = layers_26_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_263_cast_fp16)[name = tensor("obj_323_cast_fp16")]; tensor inputs_161_cast_fp16 = add(x = inputs_159_cast_fp16, y = obj_323_cast_fp16)[name = tensor("inputs_161_cast_fp16")]; tensor var_5913 = const()[name = tensor("op_5913"), val = tensor([1])]; tensor channels_mean_161_cast_fp16 = reduce_mean(axes = var_5913, keep_dims = var_5748, x = inputs_161_cast_fp16)[name = tensor("channels_mean_161_cast_fp16")]; tensor zero_mean_161_cast_fp16 = sub(x = inputs_161_cast_fp16, y = channels_mean_161_cast_fp16)[name = tensor("zero_mean_161_cast_fp16")]; tensor zero_mean_sq_161_cast_fp16 = mul(x = zero_mean_161_cast_fp16, y = zero_mean_161_cast_fp16)[name = tensor("zero_mean_sq_161_cast_fp16")]; tensor var_5917 = const()[name = tensor("op_5917"), val = tensor([1])]; tensor var_5918_cast_fp16 = reduce_mean(axes = var_5917, keep_dims = var_5748, x = zero_mean_sq_161_cast_fp16)[name = tensor("op_5918_cast_fp16")]; tensor var_5919_to_fp16 = const()[name = tensor("op_5919_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5920_cast_fp16 = add(x = var_5918_cast_fp16, y = var_5919_to_fp16)[name = tensor("op_5920_cast_fp16")]; tensor denom_161_epsilon_0 = const()[name = tensor("denom_161_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_161_cast_fp16 = rsqrt(epsilon = denom_161_epsilon_0, x = var_5920_cast_fp16)[name = tensor("denom_161_cast_fp16")]; tensor out_161_cast_fp16 = mul(x = zero_mean_161_cast_fp16, y = denom_161_cast_fp16)[name = tensor("out_161_cast_fp16")]; tensor input_265_gamma_0_to_fp16 = const()[name = tensor("input_265_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(702311296)))]; tensor input_265_beta_0_to_fp16 = const()[name = tensor("input_265_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(702313920)))]; tensor input_265_epsilon_0_to_fp16 = const()[name = tensor("input_265_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_265_cast_fp16 = batch_norm(beta = input_265_beta_0_to_fp16, epsilon = input_265_epsilon_0_to_fp16, gamma = input_265_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_161_cast_fp16)[name = tensor("input_265_cast_fp16")]; tensor var_5931 = const()[name = tensor("op_5931"), val = tensor([1, 1])]; tensor var_5933 = const()[name = tensor("op_5933"), val = tensor([1, 1])]; tensor input_267_pad_type_0 = const()[name = tensor("input_267_pad_type_0"), val = tensor("custom")]; tensor input_267_pad_0 = const()[name = tensor("input_267_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(702316544))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(705593408))), name = tensor("layers_26_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_26_fc1_bias_to_fp16 = const()[name = tensor("layers_26_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(705593536)))]; tensor input_267_cast_fp16 = conv(bias = layers_26_fc1_bias_to_fp16, dilations = var_5933, groups = var_5747, pad = input_267_pad_0, pad_type = input_267_pad_type_0, strides = var_5931, weight = layers_26_fc1_weight_to_fp16_palettized, x = input_265_cast_fp16)[name = tensor("input_267_cast_fp16")]; tensor input_269_mode_0 = const()[name = tensor("input_269_mode_0"), val = tensor("EXACT")]; tensor input_269_cast_fp16 = gelu(mode = input_269_mode_0, x = input_267_cast_fp16)[name = tensor("input_269_cast_fp16")]; tensor var_5939 = const()[name = tensor("op_5939"), val = tensor([1, 1])]; tensor var_5941 = const()[name = tensor("op_5941"), val = tensor([1, 1])]; tensor hidden_states_55_pad_type_0 = const()[name = tensor("hidden_states_55_pad_type_0"), val = tensor("custom")]; tensor hidden_states_55_pad_0 = const()[name = tensor("hidden_states_55_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_26_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(705603840))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(710519104))), name = tensor("layers_26_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_26_fc2_bias_to_fp16 = const()[name = tensor("layers_26_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(710519296)))]; tensor hidden_states_55_cast_fp16 = conv(bias = layers_26_fc2_bias_to_fp16, dilations = var_5941, groups = var_5747, pad = hidden_states_55_pad_0, pad_type = hidden_states_55_pad_type_0, strides = var_5939, weight = layers_26_fc2_weight_to_fp16_palettized, x = input_269_cast_fp16)[name = tensor("hidden_states_55_cast_fp16")]; tensor inputs_163_cast_fp16 = add(x = inputs_161_cast_fp16, y = hidden_states_55_cast_fp16)[name = tensor("inputs_163_cast_fp16")]; tensor var_5954 = const()[name = tensor("op_5954"), val = tensor(3)]; tensor var_5961 = const()[name = tensor("op_5961"), val = tensor(1)]; tensor var_5962 = const()[name = tensor("op_5962"), val = tensor(true)]; tensor var_5974 = const()[name = tensor("op_5974"), val = tensor([1])]; tensor channels_mean_163_cast_fp16 = reduce_mean(axes = var_5974, keep_dims = var_5962, x = inputs_163_cast_fp16)[name = tensor("channels_mean_163_cast_fp16")]; tensor zero_mean_163_cast_fp16 = sub(x = inputs_163_cast_fp16, y = channels_mean_163_cast_fp16)[name = tensor("zero_mean_163_cast_fp16")]; tensor zero_mean_sq_163_cast_fp16 = mul(x = zero_mean_163_cast_fp16, y = zero_mean_163_cast_fp16)[name = tensor("zero_mean_sq_163_cast_fp16")]; tensor var_5978 = const()[name = tensor("op_5978"), val = tensor([1])]; tensor var_5979_cast_fp16 = reduce_mean(axes = var_5978, keep_dims = var_5962, x = zero_mean_sq_163_cast_fp16)[name = tensor("op_5979_cast_fp16")]; tensor var_5980_to_fp16 = const()[name = tensor("op_5980_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5981_cast_fp16 = add(x = var_5979_cast_fp16, y = var_5980_to_fp16)[name = tensor("op_5981_cast_fp16")]; tensor denom_163_epsilon_0 = const()[name = tensor("denom_163_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_163_cast_fp16 = rsqrt(epsilon = denom_163_epsilon_0, x = var_5981_cast_fp16)[name = tensor("denom_163_cast_fp16")]; tensor out_163_cast_fp16 = mul(x = zero_mean_163_cast_fp16, y = denom_163_cast_fp16)[name = tensor("out_163_cast_fp16")]; tensor obj_325_gamma_0_to_fp16 = const()[name = tensor("obj_325_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(710521920)))]; tensor obj_325_beta_0_to_fp16 = const()[name = tensor("obj_325_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(710524544)))]; tensor obj_325_epsilon_0_to_fp16 = const()[name = tensor("obj_325_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_325_cast_fp16 = batch_norm(beta = obj_325_beta_0_to_fp16, epsilon = obj_325_epsilon_0_to_fp16, gamma = obj_325_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_163_cast_fp16)[name = tensor("obj_325_cast_fp16")]; tensor var_5996 = const()[name = tensor("op_5996"), val = tensor([1, 1])]; tensor var_5998 = const()[name = tensor("op_5998"), val = tensor([1, 1])]; tensor query_109_pad_type_0 = const()[name = tensor("query_109_pad_type_0"), val = tensor("custom")]; tensor query_109_pad_0 = const()[name = tensor("query_109_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(710527168))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(711756032))), name = tensor("layers_27_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_27_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_27_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(711756224)))]; tensor query_109_cast_fp16 = conv(bias = layers_27_self_attn_q_proj_bias_to_fp16, dilations = var_5998, groups = var_5961, pad = query_109_pad_0, pad_type = query_109_pad_type_0, strides = var_5996, weight = layers_27_self_attn_q_proj_weight_to_fp16_palettized, x = obj_325_cast_fp16)[name = tensor("query_109_cast_fp16")]; tensor var_6002 = const()[name = tensor("op_6002"), val = tensor([1, 1])]; tensor var_6004 = const()[name = tensor("op_6004"), val = tensor([1, 1])]; tensor current_key_55_pad_type_0 = const()[name = tensor("current_key_55_pad_type_0"), val = tensor("custom")]; tensor current_key_55_pad_0 = const()[name = tensor("current_key_55_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(711758848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(712987712))), name = tensor("layers_27_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_55_cast_fp16 = conv(dilations = var_6004, groups = var_5961, pad = current_key_55_pad_0, pad_type = current_key_55_pad_type_0, strides = var_6002, weight = layers_27_self_attn_k_proj_weight_to_fp16_palettized, x = obj_325_cast_fp16)[name = tensor("current_key_55_cast_fp16")]; tensor var_6009 = const()[name = tensor("op_6009"), val = tensor([1, 1])]; tensor var_6011 = const()[name = tensor("op_6011"), val = tensor([1, 1])]; tensor current_value_55_pad_type_0 = const()[name = tensor("current_value_55_pad_type_0"), val = tensor("custom")]; tensor current_value_55_pad_0 = const()[name = tensor("current_value_55_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(712987904))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(713807168))), name = tensor("layers_27_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_27_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_27_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(713807296)))]; tensor current_value_55_cast_fp16 = conv(bias = layers_27_self_attn_v_proj_bias_to_fp16, dilations = var_6011, groups = var_5961, pad = current_value_55_pad_0, pad_type = current_value_55_pad_type_0, strides = var_6009, weight = layers_27_self_attn_v_proj_weight_to_fp16_palettized, x = obj_325_cast_fp16)[name = tensor("current_value_55_cast_fp16")]; tensor var_6018_cast_fp16 = mul(x = current_key_55_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6018_cast_fp16")]; tensor var_6020_cast_fp16 = mul(x = var_103_cast_fp16_27, y = var_241_cast_fp16)[name = tensor("op_6020_cast_fp16")]; tensor key_109_cast_fp16 = add(x = var_6018_cast_fp16, y = var_6020_cast_fp16)[name = tensor("key_109_cast_fp16")]; tensor var_6022_cast_fp16 = mul(x = current_value_55_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6022_cast_fp16")]; tensor var_6024_cast_fp16 = mul(x = var_138_cast_fp16_27, y = var_241_cast_fp16)[name = tensor("op_6024_cast_fp16")]; tensor value_109_cast_fp16 = add(x = var_6022_cast_fp16, y = var_6024_cast_fp16)[name = tensor("value_109_cast_fp16")]; tensor var_6027 = const()[name = tensor("op_6027"), val = tensor([1, 20, 64, -1])]; tensor var_6028_cast_fp16 = reshape(shape = var_6027, x = query_109_cast_fp16)[name = tensor("op_6028_cast_fp16")]; tensor var_6029_to_fp16 = const()[name = tensor("op_6029_to_fp16"), val = tensor(0x1p-3)]; tensor var_6030_cast_fp16 = mul(x = var_6028_cast_fp16, y = var_6029_to_fp16)[name = tensor("op_6030_cast_fp16")]; tensor var_6031 = const()[name = tensor("op_6031"), val = tensor([1, 20, 64, -1])]; tensor var_6032_cast_fp16 = reshape(shape = var_6031, x = key_109_cast_fp16)[name = tensor("op_6032_cast_fp16")]; tensor mh_w_163_transpose_x_0 = const()[name = tensor("mh_w_163_transpose_x_0"), val = tensor(true)]; tensor mh_w_163_transpose_y_0 = const()[name = tensor("mh_w_163_transpose_y_0"), val = tensor(false)]; tensor mh_w_163_cast_fp16 = matmul(transpose_x = mh_w_163_transpose_x_0, transpose_y = mh_w_163_transpose_y_0, x = var_6030_cast_fp16, y = var_6032_cast_fp16)[name = tensor("mh_w_163_cast_fp16")]; tensor mh_w_165_cast_fp16 = add(x = mh_w_163_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_165_cast_fp16")]; tensor var_6040_cast_fp16 = softmax(axis = var_5954, x = mh_w_165_cast_fp16)[name = tensor("op_6040_cast_fp16")]; tensor var_6041 = const()[name = tensor("op_6041"), val = tensor([1, 20, 64, -1])]; tensor var_6042_cast_fp16 = reshape(shape = var_6041, x = value_109_cast_fp16)[name = tensor("op_6042_cast_fp16")]; tensor attn_109_transpose_x_0 = const()[name = tensor("attn_109_transpose_x_0"), val = tensor(false)]; tensor attn_109_transpose_y_0 = const()[name = tensor("attn_109_transpose_y_0"), val = tensor(true)]; tensor attn_109_cast_fp16 = matmul(transpose_x = attn_109_transpose_x_0, transpose_y = attn_109_transpose_y_0, x = var_6042_cast_fp16, y = var_6040_cast_fp16)[name = tensor("attn_109_cast_fp16")]; tensor var_6045 = const()[name = tensor("op_6045"), val = tensor([1, 1280, 1, -1])]; tensor input_271_cast_fp16 = reshape(shape = var_6045, x = attn_109_cast_fp16)[name = tensor("input_271_cast_fp16")]; tensor var_6049 = const()[name = tensor("op_6049"), val = tensor([1, 1])]; tensor var_6051 = const()[name = tensor("op_6051"), val = tensor([1, 1])]; tensor obj_331_pad_type_0 = const()[name = tensor("obj_331_pad_type_0"), val = tensor("custom")]; tensor obj_331_pad_0 = const()[name = tensor("obj_331_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(713809920))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715038784))), name = tensor("layers_27_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_27_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_27_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715038976)))]; tensor obj_331_cast_fp16 = conv(bias = layers_27_self_attn_o_proj_bias_to_fp16, dilations = var_6051, groups = var_5961, pad = obj_331_pad_0, pad_type = obj_331_pad_type_0, strides = var_6049, weight = layers_27_self_attn_o_proj_weight_to_fp16_palettized, x = input_271_cast_fp16)[name = tensor("obj_331_cast_fp16")]; tensor inputs_165_cast_fp16 = add(x = inputs_163_cast_fp16, y = obj_331_cast_fp16)[name = tensor("inputs_165_cast_fp16")]; tensor var_6061 = const()[name = tensor("op_6061"), val = tensor([1])]; tensor channels_mean_165_cast_fp16 = reduce_mean(axes = var_6061, keep_dims = var_5962, x = inputs_165_cast_fp16)[name = tensor("channels_mean_165_cast_fp16")]; tensor zero_mean_165_cast_fp16 = sub(x = inputs_165_cast_fp16, y = channels_mean_165_cast_fp16)[name = tensor("zero_mean_165_cast_fp16")]; tensor zero_mean_sq_165_cast_fp16 = mul(x = zero_mean_165_cast_fp16, y = zero_mean_165_cast_fp16)[name = tensor("zero_mean_sq_165_cast_fp16")]; tensor var_6065 = const()[name = tensor("op_6065"), val = tensor([1])]; tensor var_6066_cast_fp16 = reduce_mean(axes = var_6065, keep_dims = var_5962, x = zero_mean_sq_165_cast_fp16)[name = tensor("op_6066_cast_fp16")]; tensor var_6067_to_fp16 = const()[name = tensor("op_6067_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6068_cast_fp16 = add(x = var_6066_cast_fp16, y = var_6067_to_fp16)[name = tensor("op_6068_cast_fp16")]; tensor denom_165_epsilon_0 = const()[name = tensor("denom_165_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_165_cast_fp16 = rsqrt(epsilon = denom_165_epsilon_0, x = var_6068_cast_fp16)[name = tensor("denom_165_cast_fp16")]; tensor out_165_cast_fp16 = mul(x = zero_mean_165_cast_fp16, y = denom_165_cast_fp16)[name = tensor("out_165_cast_fp16")]; tensor obj_333_gamma_0_to_fp16 = const()[name = tensor("obj_333_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715041600)))]; tensor obj_333_beta_0_to_fp16 = const()[name = tensor("obj_333_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715044224)))]; tensor obj_333_epsilon_0_to_fp16 = const()[name = tensor("obj_333_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_333_cast_fp16 = batch_norm(beta = obj_333_beta_0_to_fp16, epsilon = obj_333_epsilon_0_to_fp16, gamma = obj_333_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_165_cast_fp16)[name = tensor("obj_333_cast_fp16")]; tensor var_6083 = const()[name = tensor("op_6083"), val = tensor([1, 1])]; tensor var_6085 = const()[name = tensor("op_6085"), val = tensor([1, 1])]; tensor query_111_pad_type_0 = const()[name = tensor("query_111_pad_type_0"), val = tensor("custom")]; tensor query_111_pad_0 = const()[name = tensor("query_111_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(715046848))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(716275712))), name = tensor("layers_27_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_27_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_27_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(716275904)))]; tensor query_111_cast_fp16 = conv(bias = layers_27_encoder_attn_q_proj_bias_to_fp16, dilations = var_6085, groups = var_5961, pad = query_111_pad_0, pad_type = query_111_pad_type_0, strides = var_6083, weight = layers_27_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_333_cast_fp16)[name = tensor("query_111_cast_fp16")]; tensor var_6089 = const()[name = tensor("op_6089"), val = tensor([1, 1])]; tensor var_6091 = const()[name = tensor("op_6091"), val = tensor([1, 1])]; tensor key_111_pad_type_0 = const()[name = tensor("key_111_pad_type_0"), val = tensor("custom")]; tensor key_111_pad_0 = const()[name = tensor("key_111_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(716278528))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(717916992))), name = tensor("layers_27_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_111_cast_fp16 = conv(dilations = var_6091, groups = var_5961, pad = key_111_pad_0, pad_type = key_111_pad_type_0, strides = var_6089, weight = layers_27_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_111_cast_fp16")]; tensor var_6096 = const()[name = tensor("op_6096"), val = tensor([1, 1])]; tensor var_6098 = const()[name = tensor("op_6098"), val = tensor([1, 1])]; tensor value_111_pad_type_0 = const()[name = tensor("value_111_pad_type_0"), val = tensor("custom")]; tensor value_111_pad_0 = const()[name = tensor("value_111_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_encoder_attn_v_proj_weight_to_fp16 = const()[name = tensor("layers_27_encoder_attn_v_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(717917568)))]; tensor layers_27_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_27_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(721194432)))]; tensor value_111_cast_fp16 = conv(bias = layers_27_encoder_attn_v_proj_bias_to_fp16, dilations = var_6098, groups = var_5961, pad = value_111_pad_0, pad_type = value_111_pad_type_0, strides = var_6096, weight = layers_27_encoder_attn_v_proj_weight_to_fp16, x = encoder_output_embeds)[name = tensor("value_111_cast_fp16")]; tensor var_6102 = const()[name = tensor("op_6102"), val = tensor([1, 20, 64, -1])]; tensor var_6103_cast_fp16 = reshape(shape = var_6102, x = query_111_cast_fp16)[name = tensor("op_6103_cast_fp16")]; tensor var_6104_to_fp16 = const()[name = tensor("op_6104_to_fp16"), val = tensor(0x1p-3)]; tensor var_6105_cast_fp16 = mul(x = var_6103_cast_fp16, y = var_6104_to_fp16)[name = tensor("op_6105_cast_fp16")]; tensor var_6106 = const()[name = tensor("op_6106"), val = tensor([1, 20, 64, -1])]; tensor var_6107_cast_fp16 = reshape(shape = var_6106, x = key_111_cast_fp16)[name = tensor("op_6107_cast_fp16")]; tensor mh_w_167_transpose_x_0 = const()[name = tensor("mh_w_167_transpose_x_0"), val = tensor(true)]; tensor mh_w_167_transpose_y_0 = const()[name = tensor("mh_w_167_transpose_y_0"), val = tensor(false)]; tensor mh_w_167_cast_fp16 = matmul(transpose_x = mh_w_167_transpose_x_0, transpose_y = mh_w_167_transpose_y_0, x = var_6105_cast_fp16, y = var_6107_cast_fp16)[name = tensor("mh_w_167_cast_fp16")]; tensor var_6110_cast_fp16 = softmax(axis = var_5954, x = mh_w_167_cast_fp16)[name = tensor("op_6110_cast_fp16")]; tensor var_6111 = const()[name = tensor("op_6111"), val = tensor([1, 20, 64, -1])]; tensor var_6112_cast_fp16 = reshape(shape = var_6111, x = value_111_cast_fp16)[name = tensor("op_6112_cast_fp16")]; tensor attn_111_transpose_x_0 = const()[name = tensor("attn_111_transpose_x_0"), val = tensor(false)]; tensor attn_111_transpose_y_0 = const()[name = tensor("attn_111_transpose_y_0"), val = tensor(true)]; tensor attn_111_cast_fp16 = matmul(transpose_x = attn_111_transpose_x_0, transpose_y = attn_111_transpose_y_0, x = var_6112_cast_fp16, y = var_6110_cast_fp16)[name = tensor("attn_111_cast_fp16")]; tensor var_6115 = const()[name = tensor("op_6115"), val = tensor([1, 1280, 1, -1])]; tensor input_273_cast_fp16 = reshape(shape = var_6115, x = attn_111_cast_fp16)[name = tensor("input_273_cast_fp16")]; tensor var_6119 = const()[name = tensor("op_6119"), val = tensor([1, 1])]; tensor var_6121 = const()[name = tensor("op_6121"), val = tensor([1, 1])]; tensor obj_335_pad_type_0 = const()[name = tensor("obj_335_pad_type_0"), val = tensor("custom")]; tensor obj_335_pad_0 = const()[name = tensor("obj_335_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_encoder_attn_o_proj_weight_to_fp16 = const()[name = tensor("layers_27_encoder_attn_o_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(721197056)))]; tensor layers_27_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_27_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(724473920)))]; tensor obj_335_cast_fp16 = conv(bias = layers_27_encoder_attn_o_proj_bias_to_fp16, dilations = var_6121, groups = var_5961, pad = obj_335_pad_0, pad_type = obj_335_pad_type_0, strides = var_6119, weight = layers_27_encoder_attn_o_proj_weight_to_fp16, x = input_273_cast_fp16)[name = tensor("obj_335_cast_fp16")]; tensor inputs_167_cast_fp16 = add(x = inputs_165_cast_fp16, y = obj_335_cast_fp16)[name = tensor("inputs_167_cast_fp16")]; tensor var_6127 = const()[name = tensor("op_6127"), val = tensor([1])]; tensor channels_mean_167_cast_fp16 = reduce_mean(axes = var_6127, keep_dims = var_5962, x = inputs_167_cast_fp16)[name = tensor("channels_mean_167_cast_fp16")]; tensor zero_mean_167_cast_fp16 = sub(x = inputs_167_cast_fp16, y = channels_mean_167_cast_fp16)[name = tensor("zero_mean_167_cast_fp16")]; tensor zero_mean_sq_167_cast_fp16 = mul(x = zero_mean_167_cast_fp16, y = zero_mean_167_cast_fp16)[name = tensor("zero_mean_sq_167_cast_fp16")]; tensor var_6131 = const()[name = tensor("op_6131"), val = tensor([1])]; tensor var_6132_cast_fp16 = reduce_mean(axes = var_6131, keep_dims = var_5962, x = zero_mean_sq_167_cast_fp16)[name = tensor("op_6132_cast_fp16")]; tensor var_6133_to_fp16 = const()[name = tensor("op_6133_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6134_cast_fp16 = add(x = var_6132_cast_fp16, y = var_6133_to_fp16)[name = tensor("op_6134_cast_fp16")]; tensor denom_167_epsilon_0 = const()[name = tensor("denom_167_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_167_cast_fp16 = rsqrt(epsilon = denom_167_epsilon_0, x = var_6134_cast_fp16)[name = tensor("denom_167_cast_fp16")]; tensor out_167_cast_fp16 = mul(x = zero_mean_167_cast_fp16, y = denom_167_cast_fp16)[name = tensor("out_167_cast_fp16")]; tensor input_275_gamma_0_to_fp16 = const()[name = tensor("input_275_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(724476544)))]; tensor input_275_beta_0_to_fp16 = const()[name = tensor("input_275_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(724479168)))]; tensor input_275_epsilon_0_to_fp16 = const()[name = tensor("input_275_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_275_cast_fp16 = batch_norm(beta = input_275_beta_0_to_fp16, epsilon = input_275_epsilon_0_to_fp16, gamma = input_275_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_167_cast_fp16)[name = tensor("input_275_cast_fp16")]; tensor var_6145 = const()[name = tensor("op_6145"), val = tensor([1, 1])]; tensor var_6147 = const()[name = tensor("op_6147"), val = tensor([1, 1])]; tensor input_277_pad_type_0 = const()[name = tensor("input_277_pad_type_0"), val = tensor("custom")]; tensor input_277_pad_0 = const()[name = tensor("input_277_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(724481792))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(729397056))), name = tensor("layers_27_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_27_fc1_bias_to_fp16 = const()[name = tensor("layers_27_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(729397248)))]; tensor input_277_cast_fp16 = conv(bias = layers_27_fc1_bias_to_fp16, dilations = var_6147, groups = var_5961, pad = input_277_pad_0, pad_type = input_277_pad_type_0, strides = var_6145, weight = layers_27_fc1_weight_to_fp16_palettized, x = input_275_cast_fp16)[name = tensor("input_277_cast_fp16")]; tensor input_279_mode_0 = const()[name = tensor("input_279_mode_0"), val = tensor("EXACT")]; tensor input_279_cast_fp16 = gelu(mode = input_279_mode_0, x = input_277_cast_fp16)[name = tensor("input_279_cast_fp16")]; tensor var_6153 = const()[name = tensor("op_6153"), val = tensor([1, 1])]; tensor var_6155 = const()[name = tensor("op_6155"), val = tensor([1, 1])]; tensor hidden_states_57_pad_type_0 = const()[name = tensor("hidden_states_57_pad_type_0"), val = tensor("custom")]; tensor hidden_states_57_pad_0 = const()[name = tensor("hidden_states_57_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_27_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(729407552))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(734322816))), name = tensor("layers_27_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_27_fc2_bias_to_fp16 = const()[name = tensor("layers_27_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(734323008)))]; tensor hidden_states_57_cast_fp16 = conv(bias = layers_27_fc2_bias_to_fp16, dilations = var_6155, groups = var_5961, pad = hidden_states_57_pad_0, pad_type = hidden_states_57_pad_type_0, strides = var_6153, weight = layers_27_fc2_weight_to_fp16_palettized, x = input_279_cast_fp16)[name = tensor("hidden_states_57_cast_fp16")]; tensor inputs_169_cast_fp16 = add(x = inputs_167_cast_fp16, y = hidden_states_57_cast_fp16)[name = tensor("inputs_169_cast_fp16")]; tensor var_6168 = const()[name = tensor("op_6168"), val = tensor(3)]; tensor var_6175 = const()[name = tensor("op_6175"), val = tensor(1)]; tensor var_6176 = const()[name = tensor("op_6176"), val = tensor(true)]; tensor var_6188 = const()[name = tensor("op_6188"), val = tensor([1])]; tensor channels_mean_169_cast_fp16 = reduce_mean(axes = var_6188, keep_dims = var_6176, x = inputs_169_cast_fp16)[name = tensor("channels_mean_169_cast_fp16")]; tensor zero_mean_169_cast_fp16 = sub(x = inputs_169_cast_fp16, y = channels_mean_169_cast_fp16)[name = tensor("zero_mean_169_cast_fp16")]; tensor zero_mean_sq_169_cast_fp16 = mul(x = zero_mean_169_cast_fp16, y = zero_mean_169_cast_fp16)[name = tensor("zero_mean_sq_169_cast_fp16")]; tensor var_6192 = const()[name = tensor("op_6192"), val = tensor([1])]; tensor var_6193_cast_fp16 = reduce_mean(axes = var_6192, keep_dims = var_6176, x = zero_mean_sq_169_cast_fp16)[name = tensor("op_6193_cast_fp16")]; tensor var_6194_to_fp16 = const()[name = tensor("op_6194_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6195_cast_fp16 = add(x = var_6193_cast_fp16, y = var_6194_to_fp16)[name = tensor("op_6195_cast_fp16")]; tensor denom_169_epsilon_0 = const()[name = tensor("denom_169_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_169_cast_fp16 = rsqrt(epsilon = denom_169_epsilon_0, x = var_6195_cast_fp16)[name = tensor("denom_169_cast_fp16")]; tensor out_169_cast_fp16 = mul(x = zero_mean_169_cast_fp16, y = denom_169_cast_fp16)[name = tensor("out_169_cast_fp16")]; tensor obj_337_gamma_0_to_fp16 = const()[name = tensor("obj_337_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(734325632)))]; tensor obj_337_beta_0_to_fp16 = const()[name = tensor("obj_337_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(734328256)))]; tensor obj_337_epsilon_0_to_fp16 = const()[name = tensor("obj_337_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_337_cast_fp16 = batch_norm(beta = obj_337_beta_0_to_fp16, epsilon = obj_337_epsilon_0_to_fp16, gamma = obj_337_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_169_cast_fp16)[name = tensor("obj_337_cast_fp16")]; tensor var_6210 = const()[name = tensor("op_6210"), val = tensor([1, 1])]; tensor var_6212 = const()[name = tensor("op_6212"), val = tensor([1, 1])]; tensor query_113_pad_type_0 = const()[name = tensor("query_113_pad_type_0"), val = tensor("custom")]; tensor query_113_pad_0 = const()[name = tensor("query_113_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(734330880))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(735559744))), name = tensor("layers_28_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_28_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_28_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(735559936)))]; tensor query_113_cast_fp16 = conv(bias = layers_28_self_attn_q_proj_bias_to_fp16, dilations = var_6212, groups = var_6175, pad = query_113_pad_0, pad_type = query_113_pad_type_0, strides = var_6210, weight = layers_28_self_attn_q_proj_weight_to_fp16_palettized, x = obj_337_cast_fp16)[name = tensor("query_113_cast_fp16")]; tensor var_6216 = const()[name = tensor("op_6216"), val = tensor([1, 1])]; tensor var_6218 = const()[name = tensor("op_6218"), val = tensor([1, 1])]; tensor current_key_57_pad_type_0 = const()[name = tensor("current_key_57_pad_type_0"), val = tensor("custom")]; tensor current_key_57_pad_0 = const()[name = tensor("current_key_57_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(735562560))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736381824))), name = tensor("layers_28_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_57_cast_fp16 = conv(dilations = var_6218, groups = var_6175, pad = current_key_57_pad_0, pad_type = current_key_57_pad_type_0, strides = var_6216, weight = layers_28_self_attn_k_proj_weight_to_fp16_palettized, x = obj_337_cast_fp16)[name = tensor("current_key_57_cast_fp16")]; tensor var_6223 = const()[name = tensor("op_6223"), val = tensor([1, 1])]; tensor var_6225 = const()[name = tensor("op_6225"), val = tensor([1, 1])]; tensor current_value_57_pad_type_0 = const()[name = tensor("current_value_57_pad_type_0"), val = tensor("custom")]; tensor current_value_57_pad_0 = const()[name = tensor("current_value_57_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(736381952))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(737201216))), name = tensor("layers_28_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_28_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_28_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(737201344)))]; tensor current_value_57_cast_fp16 = conv(bias = layers_28_self_attn_v_proj_bias_to_fp16, dilations = var_6225, groups = var_6175, pad = current_value_57_pad_0, pad_type = current_value_57_pad_type_0, strides = var_6223, weight = layers_28_self_attn_v_proj_weight_to_fp16_palettized, x = obj_337_cast_fp16)[name = tensor("current_value_57_cast_fp16")]; tensor var_6232_cast_fp16 = mul(x = current_key_57_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6232_cast_fp16")]; tensor var_6234_cast_fp16 = mul(x = var_103_cast_fp16_28, y = var_241_cast_fp16)[name = tensor("op_6234_cast_fp16")]; tensor key_113_cast_fp16 = add(x = var_6232_cast_fp16, y = var_6234_cast_fp16)[name = tensor("key_113_cast_fp16")]; tensor var_6236_cast_fp16 = mul(x = current_value_57_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6236_cast_fp16")]; tensor var_6238_cast_fp16 = mul(x = var_138_cast_fp16_28, y = var_241_cast_fp16)[name = tensor("op_6238_cast_fp16")]; tensor value_113_cast_fp16 = add(x = var_6236_cast_fp16, y = var_6238_cast_fp16)[name = tensor("value_113_cast_fp16")]; tensor var_6241 = const()[name = tensor("op_6241"), val = tensor([1, 20, 64, -1])]; tensor var_6242_cast_fp16 = reshape(shape = var_6241, x = query_113_cast_fp16)[name = tensor("op_6242_cast_fp16")]; tensor var_6243_to_fp16 = const()[name = tensor("op_6243_to_fp16"), val = tensor(0x1p-3)]; tensor var_6244_cast_fp16 = mul(x = var_6242_cast_fp16, y = var_6243_to_fp16)[name = tensor("op_6244_cast_fp16")]; tensor var_6245 = const()[name = tensor("op_6245"), val = tensor([1, 20, 64, -1])]; tensor var_6246_cast_fp16 = reshape(shape = var_6245, x = key_113_cast_fp16)[name = tensor("op_6246_cast_fp16")]; tensor mh_w_169_transpose_x_0 = const()[name = tensor("mh_w_169_transpose_x_0"), val = tensor(true)]; tensor mh_w_169_transpose_y_0 = const()[name = tensor("mh_w_169_transpose_y_0"), val = tensor(false)]; tensor mh_w_169_cast_fp16 = matmul(transpose_x = mh_w_169_transpose_x_0, transpose_y = mh_w_169_transpose_y_0, x = var_6244_cast_fp16, y = var_6246_cast_fp16)[name = tensor("mh_w_169_cast_fp16")]; tensor mh_w_171_cast_fp16 = add(x = mh_w_169_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_171_cast_fp16")]; tensor var_6254_cast_fp16 = softmax(axis = var_6168, x = mh_w_171_cast_fp16)[name = tensor("op_6254_cast_fp16")]; tensor var_6255 = const()[name = tensor("op_6255"), val = tensor([1, 20, 64, -1])]; tensor var_6256_cast_fp16 = reshape(shape = var_6255, x = value_113_cast_fp16)[name = tensor("op_6256_cast_fp16")]; tensor attn_113_transpose_x_0 = const()[name = tensor("attn_113_transpose_x_0"), val = tensor(false)]; tensor attn_113_transpose_y_0 = const()[name = tensor("attn_113_transpose_y_0"), val = tensor(true)]; tensor attn_113_cast_fp16 = matmul(transpose_x = attn_113_transpose_x_0, transpose_y = attn_113_transpose_y_0, x = var_6256_cast_fp16, y = var_6254_cast_fp16)[name = tensor("attn_113_cast_fp16")]; tensor var_6259 = const()[name = tensor("op_6259"), val = tensor([1, 1280, 1, -1])]; tensor input_281_cast_fp16 = reshape(shape = var_6259, x = attn_113_cast_fp16)[name = tensor("input_281_cast_fp16")]; tensor var_6263 = const()[name = tensor("op_6263"), val = tensor([1, 1])]; tensor var_6265 = const()[name = tensor("op_6265"), val = tensor([1, 1])]; tensor obj_343_pad_type_0 = const()[name = tensor("obj_343_pad_type_0"), val = tensor("custom")]; tensor obj_343_pad_0 = const()[name = tensor("obj_343_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(737203968))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(738023232))), name = tensor("layers_28_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_28_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_28_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(738023360)))]; tensor obj_343_cast_fp16 = conv(bias = layers_28_self_attn_o_proj_bias_to_fp16, dilations = var_6265, groups = var_6175, pad = obj_343_pad_0, pad_type = obj_343_pad_type_0, strides = var_6263, weight = layers_28_self_attn_o_proj_weight_to_fp16_palettized, x = input_281_cast_fp16)[name = tensor("obj_343_cast_fp16")]; tensor inputs_171_cast_fp16 = add(x = inputs_169_cast_fp16, y = obj_343_cast_fp16)[name = tensor("inputs_171_cast_fp16")]; tensor var_6275 = const()[name = tensor("op_6275"), val = tensor([1])]; tensor channels_mean_171_cast_fp16 = reduce_mean(axes = var_6275, keep_dims = var_6176, x = inputs_171_cast_fp16)[name = tensor("channels_mean_171_cast_fp16")]; tensor zero_mean_171_cast_fp16 = sub(x = inputs_171_cast_fp16, y = channels_mean_171_cast_fp16)[name = tensor("zero_mean_171_cast_fp16")]; tensor zero_mean_sq_171_cast_fp16 = mul(x = zero_mean_171_cast_fp16, y = zero_mean_171_cast_fp16)[name = tensor("zero_mean_sq_171_cast_fp16")]; tensor var_6279 = const()[name = tensor("op_6279"), val = tensor([1])]; tensor var_6280_cast_fp16 = reduce_mean(axes = var_6279, keep_dims = var_6176, x = zero_mean_sq_171_cast_fp16)[name = tensor("op_6280_cast_fp16")]; tensor var_6281_to_fp16 = const()[name = tensor("op_6281_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6282_cast_fp16 = add(x = var_6280_cast_fp16, y = var_6281_to_fp16)[name = tensor("op_6282_cast_fp16")]; tensor denom_171_epsilon_0 = const()[name = tensor("denom_171_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_171_cast_fp16 = rsqrt(epsilon = denom_171_epsilon_0, x = var_6282_cast_fp16)[name = tensor("denom_171_cast_fp16")]; tensor out_171_cast_fp16 = mul(x = zero_mean_171_cast_fp16, y = denom_171_cast_fp16)[name = tensor("out_171_cast_fp16")]; tensor obj_345_gamma_0_to_fp16 = const()[name = tensor("obj_345_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(738025984)))]; tensor obj_345_beta_0_to_fp16 = const()[name = tensor("obj_345_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(738028608)))]; tensor obj_345_epsilon_0_to_fp16 = const()[name = tensor("obj_345_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_345_cast_fp16 = batch_norm(beta = obj_345_beta_0_to_fp16, epsilon = obj_345_epsilon_0_to_fp16, gamma = obj_345_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_171_cast_fp16)[name = tensor("obj_345_cast_fp16")]; tensor var_6297 = const()[name = tensor("op_6297"), val = tensor([1, 1])]; tensor var_6299 = const()[name = tensor("op_6299"), val = tensor([1, 1])]; tensor query_115_pad_type_0 = const()[name = tensor("query_115_pad_type_0"), val = tensor("custom")]; tensor query_115_pad_0 = const()[name = tensor("query_115_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(738031232))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(739260096))), name = tensor("layers_28_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_28_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_28_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(739260288)))]; tensor query_115_cast_fp16 = conv(bias = layers_28_encoder_attn_q_proj_bias_to_fp16, dilations = var_6299, groups = var_6175, pad = query_115_pad_0, pad_type = query_115_pad_type_0, strides = var_6297, weight = layers_28_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_345_cast_fp16)[name = tensor("query_115_cast_fp16")]; tensor var_6303 = const()[name = tensor("op_6303"), val = tensor([1, 1])]; tensor var_6305 = const()[name = tensor("op_6305"), val = tensor([1, 1])]; tensor key_115_pad_type_0 = const()[name = tensor("key_115_pad_type_0"), val = tensor("custom")]; tensor key_115_pad_0 = const()[name = tensor("key_115_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(739262912))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(740491776))), name = tensor("layers_28_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_115_cast_fp16 = conv(dilations = var_6305, groups = var_6175, pad = key_115_pad_0, pad_type = key_115_pad_type_0, strides = var_6303, weight = layers_28_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_115_cast_fp16")]; tensor var_6310 = const()[name = tensor("op_6310"), val = tensor([1, 1])]; tensor var_6312 = const()[name = tensor("op_6312"), val = tensor([1, 1])]; tensor value_115_pad_type_0 = const()[name = tensor("value_115_pad_type_0"), val = tensor("custom")]; tensor value_115_pad_0 = const()[name = tensor("value_115_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(740491968))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(742130432))), name = tensor("layers_28_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_28_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_28_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(742131008)))]; tensor value_115_cast_fp16 = conv(bias = layers_28_encoder_attn_v_proj_bias_to_fp16, dilations = var_6312, groups = var_6175, pad = value_115_pad_0, pad_type = value_115_pad_type_0, strides = var_6310, weight = layers_28_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_115_cast_fp16")]; tensor var_6316 = const()[name = tensor("op_6316"), val = tensor([1, 20, 64, -1])]; tensor var_6317_cast_fp16 = reshape(shape = var_6316, x = query_115_cast_fp16)[name = tensor("op_6317_cast_fp16")]; tensor var_6318_to_fp16 = const()[name = tensor("op_6318_to_fp16"), val = tensor(0x1p-3)]; tensor var_6319_cast_fp16 = mul(x = var_6317_cast_fp16, y = var_6318_to_fp16)[name = tensor("op_6319_cast_fp16")]; tensor var_6320 = const()[name = tensor("op_6320"), val = tensor([1, 20, 64, -1])]; tensor var_6321_cast_fp16 = reshape(shape = var_6320, x = key_115_cast_fp16)[name = tensor("op_6321_cast_fp16")]; tensor mh_w_173_transpose_x_0 = const()[name = tensor("mh_w_173_transpose_x_0"), val = tensor(true)]; tensor mh_w_173_transpose_y_0 = const()[name = tensor("mh_w_173_transpose_y_0"), val = tensor(false)]; tensor mh_w_173_cast_fp16 = matmul(transpose_x = mh_w_173_transpose_x_0, transpose_y = mh_w_173_transpose_y_0, x = var_6319_cast_fp16, y = var_6321_cast_fp16)[name = tensor("mh_w_173_cast_fp16")]; tensor var_6324_cast_fp16 = softmax(axis = var_6168, x = mh_w_173_cast_fp16)[name = tensor("op_6324_cast_fp16")]; tensor var_6325 = const()[name = tensor("op_6325"), val = tensor([1, 20, 64, -1])]; tensor var_6326_cast_fp16 = reshape(shape = var_6325, x = value_115_cast_fp16)[name = tensor("op_6326_cast_fp16")]; tensor attn_115_transpose_x_0 = const()[name = tensor("attn_115_transpose_x_0"), val = tensor(false)]; tensor attn_115_transpose_y_0 = const()[name = tensor("attn_115_transpose_y_0"), val = tensor(true)]; tensor attn_115_cast_fp16 = matmul(transpose_x = attn_115_transpose_x_0, transpose_y = attn_115_transpose_y_0, x = var_6326_cast_fp16, y = var_6324_cast_fp16)[name = tensor("attn_115_cast_fp16")]; tensor var_6329 = const()[name = tensor("op_6329"), val = tensor([1, 1280, 1, -1])]; tensor input_283_cast_fp16 = reshape(shape = var_6329, x = attn_115_cast_fp16)[name = tensor("input_283_cast_fp16")]; tensor var_6333 = const()[name = tensor("op_6333"), val = tensor([1, 1])]; tensor var_6335 = const()[name = tensor("op_6335"), val = tensor([1, 1])]; tensor obj_347_pad_type_0 = const()[name = tensor("obj_347_pad_type_0"), val = tensor("custom")]; tensor obj_347_pad_0 = const()[name = tensor("obj_347_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(742133632))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(743362496))), name = tensor("layers_28_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_28_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_28_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(743362688)))]; tensor obj_347_cast_fp16 = conv(bias = layers_28_encoder_attn_o_proj_bias_to_fp16, dilations = var_6335, groups = var_6175, pad = obj_347_pad_0, pad_type = obj_347_pad_type_0, strides = var_6333, weight = layers_28_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_283_cast_fp16)[name = tensor("obj_347_cast_fp16")]; tensor inputs_173_cast_fp16 = add(x = inputs_171_cast_fp16, y = obj_347_cast_fp16)[name = tensor("inputs_173_cast_fp16")]; tensor var_6341 = const()[name = tensor("op_6341"), val = tensor([1])]; tensor channels_mean_173_cast_fp16 = reduce_mean(axes = var_6341, keep_dims = var_6176, x = inputs_173_cast_fp16)[name = tensor("channels_mean_173_cast_fp16")]; tensor zero_mean_173_cast_fp16 = sub(x = inputs_173_cast_fp16, y = channels_mean_173_cast_fp16)[name = tensor("zero_mean_173_cast_fp16")]; tensor zero_mean_sq_173_cast_fp16 = mul(x = zero_mean_173_cast_fp16, y = zero_mean_173_cast_fp16)[name = tensor("zero_mean_sq_173_cast_fp16")]; tensor var_6345 = const()[name = tensor("op_6345"), val = tensor([1])]; tensor var_6346_cast_fp16 = reduce_mean(axes = var_6345, keep_dims = var_6176, x = zero_mean_sq_173_cast_fp16)[name = tensor("op_6346_cast_fp16")]; tensor var_6347_to_fp16 = const()[name = tensor("op_6347_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6348_cast_fp16 = add(x = var_6346_cast_fp16, y = var_6347_to_fp16)[name = tensor("op_6348_cast_fp16")]; tensor denom_173_epsilon_0 = const()[name = tensor("denom_173_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_173_cast_fp16 = rsqrt(epsilon = denom_173_epsilon_0, x = var_6348_cast_fp16)[name = tensor("denom_173_cast_fp16")]; tensor out_173_cast_fp16 = mul(x = zero_mean_173_cast_fp16, y = denom_173_cast_fp16)[name = tensor("out_173_cast_fp16")]; tensor input_285_gamma_0_to_fp16 = const()[name = tensor("input_285_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(743365312)))]; tensor input_285_beta_0_to_fp16 = const()[name = tensor("input_285_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(743367936)))]; tensor input_285_epsilon_0_to_fp16 = const()[name = tensor("input_285_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_285_cast_fp16 = batch_norm(beta = input_285_beta_0_to_fp16, epsilon = input_285_epsilon_0_to_fp16, gamma = input_285_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_173_cast_fp16)[name = tensor("input_285_cast_fp16")]; tensor var_6359 = const()[name = tensor("op_6359"), val = tensor([1, 1])]; tensor var_6361 = const()[name = tensor("op_6361"), val = tensor([1, 1])]; tensor input_287_pad_type_0 = const()[name = tensor("input_287_pad_type_0"), val = tensor("custom")]; tensor input_287_pad_0 = const()[name = tensor("input_287_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(743370560))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(748285824))), name = tensor("layers_28_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_28_fc1_bias_to_fp16 = const()[name = tensor("layers_28_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(748286016)))]; tensor input_287_cast_fp16 = conv(bias = layers_28_fc1_bias_to_fp16, dilations = var_6361, groups = var_6175, pad = input_287_pad_0, pad_type = input_287_pad_type_0, strides = var_6359, weight = layers_28_fc1_weight_to_fp16_palettized, x = input_285_cast_fp16)[name = tensor("input_287_cast_fp16")]; tensor input_289_mode_0 = const()[name = tensor("input_289_mode_0"), val = tensor("EXACT")]; tensor input_289_cast_fp16 = gelu(mode = input_289_mode_0, x = input_287_cast_fp16)[name = tensor("input_289_cast_fp16")]; tensor var_6367 = const()[name = tensor("op_6367"), val = tensor([1, 1])]; tensor var_6369 = const()[name = tensor("op_6369"), val = tensor([1, 1])]; tensor hidden_states_59_pad_type_0 = const()[name = tensor("hidden_states_59_pad_type_0"), val = tensor("custom")]; tensor hidden_states_59_pad_0 = const()[name = tensor("hidden_states_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_28_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(748296320))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(753211584))), name = tensor("layers_28_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_28_fc2_bias_to_fp16 = const()[name = tensor("layers_28_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(753211776)))]; tensor hidden_states_59_cast_fp16 = conv(bias = layers_28_fc2_bias_to_fp16, dilations = var_6369, groups = var_6175, pad = hidden_states_59_pad_0, pad_type = hidden_states_59_pad_type_0, strides = var_6367, weight = layers_28_fc2_weight_to_fp16_palettized, x = input_289_cast_fp16)[name = tensor("hidden_states_59_cast_fp16")]; tensor inputs_175_cast_fp16 = add(x = inputs_173_cast_fp16, y = hidden_states_59_cast_fp16)[name = tensor("inputs_175_cast_fp16")]; tensor var_6382 = const()[name = tensor("op_6382"), val = tensor(3)]; tensor var_6389 = const()[name = tensor("op_6389"), val = tensor(1)]; tensor var_6390 = const()[name = tensor("op_6390"), val = tensor(true)]; tensor var_6402 = const()[name = tensor("op_6402"), val = tensor([1])]; tensor channels_mean_175_cast_fp16 = reduce_mean(axes = var_6402, keep_dims = var_6390, x = inputs_175_cast_fp16)[name = tensor("channels_mean_175_cast_fp16")]; tensor zero_mean_175_cast_fp16 = sub(x = inputs_175_cast_fp16, y = channels_mean_175_cast_fp16)[name = tensor("zero_mean_175_cast_fp16")]; tensor zero_mean_sq_175_cast_fp16 = mul(x = zero_mean_175_cast_fp16, y = zero_mean_175_cast_fp16)[name = tensor("zero_mean_sq_175_cast_fp16")]; tensor var_6406 = const()[name = tensor("op_6406"), val = tensor([1])]; tensor var_6407_cast_fp16 = reduce_mean(axes = var_6406, keep_dims = var_6390, x = zero_mean_sq_175_cast_fp16)[name = tensor("op_6407_cast_fp16")]; tensor var_6408_to_fp16 = const()[name = tensor("op_6408_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6409_cast_fp16 = add(x = var_6407_cast_fp16, y = var_6408_to_fp16)[name = tensor("op_6409_cast_fp16")]; tensor denom_175_epsilon_0 = const()[name = tensor("denom_175_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_175_cast_fp16 = rsqrt(epsilon = denom_175_epsilon_0, x = var_6409_cast_fp16)[name = tensor("denom_175_cast_fp16")]; tensor out_175_cast_fp16 = mul(x = zero_mean_175_cast_fp16, y = denom_175_cast_fp16)[name = tensor("out_175_cast_fp16")]; tensor obj_349_gamma_0_to_fp16 = const()[name = tensor("obj_349_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(753214400)))]; tensor obj_349_beta_0_to_fp16 = const()[name = tensor("obj_349_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(753217024)))]; tensor obj_349_epsilon_0_to_fp16 = const()[name = tensor("obj_349_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_349_cast_fp16 = batch_norm(beta = obj_349_beta_0_to_fp16, epsilon = obj_349_epsilon_0_to_fp16, gamma = obj_349_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_175_cast_fp16)[name = tensor("obj_349_cast_fp16")]; tensor var_6424 = const()[name = tensor("op_6424"), val = tensor([1, 1])]; tensor var_6426 = const()[name = tensor("op_6426"), val = tensor([1, 1])]; tensor query_117_pad_type_0 = const()[name = tensor("query_117_pad_type_0"), val = tensor("custom")]; tensor query_117_pad_0 = const()[name = tensor("query_117_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(753219648))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(754038912))), name = tensor("layers_29_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_29_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_29_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(754039040)))]; tensor query_117_cast_fp16 = conv(bias = layers_29_self_attn_q_proj_bias_to_fp16, dilations = var_6426, groups = var_6389, pad = query_117_pad_0, pad_type = query_117_pad_type_0, strides = var_6424, weight = layers_29_self_attn_q_proj_weight_to_fp16_palettized, x = obj_349_cast_fp16)[name = tensor("query_117_cast_fp16")]; tensor var_6430 = const()[name = tensor("op_6430"), val = tensor([1, 1])]; tensor var_6432 = const()[name = tensor("op_6432"), val = tensor([1, 1])]; tensor current_key_59_pad_type_0 = const()[name = tensor("current_key_59_pad_type_0"), val = tensor("custom")]; tensor current_key_59_pad_0 = const()[name = tensor("current_key_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(754041664))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(754860928))), name = tensor("layers_29_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_59_cast_fp16 = conv(dilations = var_6432, groups = var_6389, pad = current_key_59_pad_0, pad_type = current_key_59_pad_type_0, strides = var_6430, weight = layers_29_self_attn_k_proj_weight_to_fp16_palettized, x = obj_349_cast_fp16)[name = tensor("current_key_59_cast_fp16")]; tensor var_6437 = const()[name = tensor("op_6437"), val = tensor([1, 1])]; tensor var_6439 = const()[name = tensor("op_6439"), val = tensor([1, 1])]; tensor current_value_59_pad_type_0 = const()[name = tensor("current_value_59_pad_type_0"), val = tensor("custom")]; tensor current_value_59_pad_0 = const()[name = tensor("current_value_59_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(754861056))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(755680320))), name = tensor("layers_29_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_29_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_29_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(755680448)))]; tensor current_value_59_cast_fp16 = conv(bias = layers_29_self_attn_v_proj_bias_to_fp16, dilations = var_6439, groups = var_6389, pad = current_value_59_pad_0, pad_type = current_value_59_pad_type_0, strides = var_6437, weight = layers_29_self_attn_v_proj_weight_to_fp16_palettized, x = obj_349_cast_fp16)[name = tensor("current_value_59_cast_fp16")]; tensor var_6446_cast_fp16 = mul(x = current_key_59_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6446_cast_fp16")]; tensor var_6448_cast_fp16 = mul(x = var_103_cast_fp16_29, y = var_241_cast_fp16)[name = tensor("op_6448_cast_fp16")]; tensor key_117_cast_fp16 = add(x = var_6446_cast_fp16, y = var_6448_cast_fp16)[name = tensor("key_117_cast_fp16")]; tensor var_6450_cast_fp16 = mul(x = current_value_59_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6450_cast_fp16")]; tensor var_6452_cast_fp16 = mul(x = var_138_cast_fp16_29, y = var_241_cast_fp16)[name = tensor("op_6452_cast_fp16")]; tensor value_117_cast_fp16 = add(x = var_6450_cast_fp16, y = var_6452_cast_fp16)[name = tensor("value_117_cast_fp16")]; tensor var_6455 = const()[name = tensor("op_6455"), val = tensor([1, 20, 64, -1])]; tensor var_6456_cast_fp16 = reshape(shape = var_6455, x = query_117_cast_fp16)[name = tensor("op_6456_cast_fp16")]; tensor var_6457_to_fp16 = const()[name = tensor("op_6457_to_fp16"), val = tensor(0x1p-3)]; tensor var_6458_cast_fp16 = mul(x = var_6456_cast_fp16, y = var_6457_to_fp16)[name = tensor("op_6458_cast_fp16")]; tensor var_6459 = const()[name = tensor("op_6459"), val = tensor([1, 20, 64, -1])]; tensor var_6460_cast_fp16 = reshape(shape = var_6459, x = key_117_cast_fp16)[name = tensor("op_6460_cast_fp16")]; tensor mh_w_175_transpose_x_0 = const()[name = tensor("mh_w_175_transpose_x_0"), val = tensor(true)]; tensor mh_w_175_transpose_y_0 = const()[name = tensor("mh_w_175_transpose_y_0"), val = tensor(false)]; tensor mh_w_175_cast_fp16 = matmul(transpose_x = mh_w_175_transpose_x_0, transpose_y = mh_w_175_transpose_y_0, x = var_6458_cast_fp16, y = var_6460_cast_fp16)[name = tensor("mh_w_175_cast_fp16")]; tensor mh_w_177_cast_fp16 = add(x = mh_w_175_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_177_cast_fp16")]; tensor var_6468_cast_fp16 = softmax(axis = var_6382, x = mh_w_177_cast_fp16)[name = tensor("op_6468_cast_fp16")]; tensor var_6469 = const()[name = tensor("op_6469"), val = tensor([1, 20, 64, -1])]; tensor var_6470_cast_fp16 = reshape(shape = var_6469, x = value_117_cast_fp16)[name = tensor("op_6470_cast_fp16")]; tensor attn_117_transpose_x_0 = const()[name = tensor("attn_117_transpose_x_0"), val = tensor(false)]; tensor attn_117_transpose_y_0 = const()[name = tensor("attn_117_transpose_y_0"), val = tensor(true)]; tensor attn_117_cast_fp16 = matmul(transpose_x = attn_117_transpose_x_0, transpose_y = attn_117_transpose_y_0, x = var_6470_cast_fp16, y = var_6468_cast_fp16)[name = tensor("attn_117_cast_fp16")]; tensor var_6473 = const()[name = tensor("op_6473"), val = tensor([1, 1280, 1, -1])]; tensor input_291_cast_fp16 = reshape(shape = var_6473, x = attn_117_cast_fp16)[name = tensor("input_291_cast_fp16")]; tensor var_6477 = const()[name = tensor("op_6477"), val = tensor([1, 1])]; tensor var_6479 = const()[name = tensor("op_6479"), val = tensor([1, 1])]; tensor obj_355_pad_type_0 = const()[name = tensor("obj_355_pad_type_0"), val = tensor("custom")]; tensor obj_355_pad_0 = const()[name = tensor("obj_355_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(755683072))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(756502336))), name = tensor("layers_29_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_29_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_29_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(756502464)))]; tensor obj_355_cast_fp16 = conv(bias = layers_29_self_attn_o_proj_bias_to_fp16, dilations = var_6479, groups = var_6389, pad = obj_355_pad_0, pad_type = obj_355_pad_type_0, strides = var_6477, weight = layers_29_self_attn_o_proj_weight_to_fp16_palettized, x = input_291_cast_fp16)[name = tensor("obj_355_cast_fp16")]; tensor inputs_177_cast_fp16 = add(x = inputs_175_cast_fp16, y = obj_355_cast_fp16)[name = tensor("inputs_177_cast_fp16")]; tensor var_6489 = const()[name = tensor("op_6489"), val = tensor([1])]; tensor channels_mean_177_cast_fp16 = reduce_mean(axes = var_6489, keep_dims = var_6390, x = inputs_177_cast_fp16)[name = tensor("channels_mean_177_cast_fp16")]; tensor zero_mean_177_cast_fp16 = sub(x = inputs_177_cast_fp16, y = channels_mean_177_cast_fp16)[name = tensor("zero_mean_177_cast_fp16")]; tensor zero_mean_sq_177_cast_fp16 = mul(x = zero_mean_177_cast_fp16, y = zero_mean_177_cast_fp16)[name = tensor("zero_mean_sq_177_cast_fp16")]; tensor var_6493 = const()[name = tensor("op_6493"), val = tensor([1])]; tensor var_6494_cast_fp16 = reduce_mean(axes = var_6493, keep_dims = var_6390, x = zero_mean_sq_177_cast_fp16)[name = tensor("op_6494_cast_fp16")]; tensor var_6495_to_fp16 = const()[name = tensor("op_6495_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6496_cast_fp16 = add(x = var_6494_cast_fp16, y = var_6495_to_fp16)[name = tensor("op_6496_cast_fp16")]; tensor denom_177_epsilon_0 = const()[name = tensor("denom_177_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_177_cast_fp16 = rsqrt(epsilon = denom_177_epsilon_0, x = var_6496_cast_fp16)[name = tensor("denom_177_cast_fp16")]; tensor out_177_cast_fp16 = mul(x = zero_mean_177_cast_fp16, y = denom_177_cast_fp16)[name = tensor("out_177_cast_fp16")]; tensor obj_357_gamma_0_to_fp16 = const()[name = tensor("obj_357_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(756505088)))]; tensor obj_357_beta_0_to_fp16 = const()[name = tensor("obj_357_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(756507712)))]; tensor obj_357_epsilon_0_to_fp16 = const()[name = tensor("obj_357_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_357_cast_fp16 = batch_norm(beta = obj_357_beta_0_to_fp16, epsilon = obj_357_epsilon_0_to_fp16, gamma = obj_357_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_177_cast_fp16)[name = tensor("obj_357_cast_fp16")]; tensor var_6511 = const()[name = tensor("op_6511"), val = tensor([1, 1])]; tensor var_6513 = const()[name = tensor("op_6513"), val = tensor([1, 1])]; tensor query_119_pad_type_0 = const()[name = tensor("query_119_pad_type_0"), val = tensor("custom")]; tensor query_119_pad_0 = const()[name = tensor("query_119_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(756510336))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(757329600))), name = tensor("layers_29_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_29_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_29_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(757329728)))]; tensor query_119_cast_fp16 = conv(bias = layers_29_encoder_attn_q_proj_bias_to_fp16, dilations = var_6513, groups = var_6389, pad = query_119_pad_0, pad_type = query_119_pad_type_0, strides = var_6511, weight = layers_29_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_357_cast_fp16)[name = tensor("query_119_cast_fp16")]; tensor var_6517 = const()[name = tensor("op_6517"), val = tensor([1, 1])]; tensor var_6519 = const()[name = tensor("op_6519"), val = tensor([1, 1])]; tensor key_119_pad_type_0 = const()[name = tensor("key_119_pad_type_0"), val = tensor("custom")]; tensor key_119_pad_0 = const()[name = tensor("key_119_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(757332352))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(758151616))), name = tensor("layers_29_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_119_cast_fp16 = conv(dilations = var_6519, groups = var_6389, pad = key_119_pad_0, pad_type = key_119_pad_type_0, strides = var_6517, weight = layers_29_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_119_cast_fp16")]; tensor var_6524 = const()[name = tensor("op_6524"), val = tensor([1, 1])]; tensor var_6526 = const()[name = tensor("op_6526"), val = tensor([1, 1])]; tensor value_119_pad_type_0 = const()[name = tensor("value_119_pad_type_0"), val = tensor("custom")]; tensor value_119_pad_0 = const()[name = tensor("value_119_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(758151744))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(759380608))), name = tensor("layers_29_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_29_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_29_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(759380800)))]; tensor value_119_cast_fp16 = conv(bias = layers_29_encoder_attn_v_proj_bias_to_fp16, dilations = var_6526, groups = var_6389, pad = value_119_pad_0, pad_type = value_119_pad_type_0, strides = var_6524, weight = layers_29_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_119_cast_fp16")]; tensor var_6530 = const()[name = tensor("op_6530"), val = tensor([1, 20, 64, -1])]; tensor var_6531_cast_fp16 = reshape(shape = var_6530, x = query_119_cast_fp16)[name = tensor("op_6531_cast_fp16")]; tensor var_6532_to_fp16 = const()[name = tensor("op_6532_to_fp16"), val = tensor(0x1p-3)]; tensor var_6533_cast_fp16 = mul(x = var_6531_cast_fp16, y = var_6532_to_fp16)[name = tensor("op_6533_cast_fp16")]; tensor var_6534 = const()[name = tensor("op_6534"), val = tensor([1, 20, 64, -1])]; tensor var_6535_cast_fp16 = reshape(shape = var_6534, x = key_119_cast_fp16)[name = tensor("op_6535_cast_fp16")]; tensor mh_w_179_transpose_x_0 = const()[name = tensor("mh_w_179_transpose_x_0"), val = tensor(true)]; tensor mh_w_179_transpose_y_0 = const()[name = tensor("mh_w_179_transpose_y_0"), val = tensor(false)]; tensor mh_w_179_cast_fp16 = matmul(transpose_x = mh_w_179_transpose_x_0, transpose_y = mh_w_179_transpose_y_0, x = var_6533_cast_fp16, y = var_6535_cast_fp16)[name = tensor("mh_w_179_cast_fp16")]; tensor var_6538_cast_fp16 = softmax(axis = var_6382, x = mh_w_179_cast_fp16)[name = tensor("op_6538_cast_fp16")]; tensor var_6539 = const()[name = tensor("op_6539"), val = tensor([1, 20, 64, -1])]; tensor var_6540_cast_fp16 = reshape(shape = var_6539, x = value_119_cast_fp16)[name = tensor("op_6540_cast_fp16")]; tensor attn_119_transpose_x_0 = const()[name = tensor("attn_119_transpose_x_0"), val = tensor(false)]; tensor attn_119_transpose_y_0 = const()[name = tensor("attn_119_transpose_y_0"), val = tensor(true)]; tensor attn_119_cast_fp16 = matmul(transpose_x = attn_119_transpose_x_0, transpose_y = attn_119_transpose_y_0, x = var_6540_cast_fp16, y = var_6538_cast_fp16)[name = tensor("attn_119_cast_fp16")]; tensor var_6543 = const()[name = tensor("op_6543"), val = tensor([1, 1280, 1, -1])]; tensor input_293_cast_fp16 = reshape(shape = var_6543, x = attn_119_cast_fp16)[name = tensor("input_293_cast_fp16")]; tensor var_6547 = const()[name = tensor("op_6547"), val = tensor([1, 1])]; tensor var_6549 = const()[name = tensor("op_6549"), val = tensor([1, 1])]; tensor obj_359_pad_type_0 = const()[name = tensor("obj_359_pad_type_0"), val = tensor("custom")]; tensor obj_359_pad_0 = const()[name = tensor("obj_359_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(759383424))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(760202688))), name = tensor("layers_29_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_29_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_29_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(760202816)))]; tensor obj_359_cast_fp16 = conv(bias = layers_29_encoder_attn_o_proj_bias_to_fp16, dilations = var_6549, groups = var_6389, pad = obj_359_pad_0, pad_type = obj_359_pad_type_0, strides = var_6547, weight = layers_29_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_293_cast_fp16)[name = tensor("obj_359_cast_fp16")]; tensor inputs_179_cast_fp16 = add(x = inputs_177_cast_fp16, y = obj_359_cast_fp16)[name = tensor("inputs_179_cast_fp16")]; tensor var_6555 = const()[name = tensor("op_6555"), val = tensor([1])]; tensor channels_mean_179_cast_fp16 = reduce_mean(axes = var_6555, keep_dims = var_6390, x = inputs_179_cast_fp16)[name = tensor("channels_mean_179_cast_fp16")]; tensor zero_mean_179_cast_fp16 = sub(x = inputs_179_cast_fp16, y = channels_mean_179_cast_fp16)[name = tensor("zero_mean_179_cast_fp16")]; tensor zero_mean_sq_179_cast_fp16 = mul(x = zero_mean_179_cast_fp16, y = zero_mean_179_cast_fp16)[name = tensor("zero_mean_sq_179_cast_fp16")]; tensor var_6559 = const()[name = tensor("op_6559"), val = tensor([1])]; tensor var_6560_cast_fp16 = reduce_mean(axes = var_6559, keep_dims = var_6390, x = zero_mean_sq_179_cast_fp16)[name = tensor("op_6560_cast_fp16")]; tensor var_6561_to_fp16 = const()[name = tensor("op_6561_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6562_cast_fp16 = add(x = var_6560_cast_fp16, y = var_6561_to_fp16)[name = tensor("op_6562_cast_fp16")]; tensor denom_179_epsilon_0 = const()[name = tensor("denom_179_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_179_cast_fp16 = rsqrt(epsilon = denom_179_epsilon_0, x = var_6562_cast_fp16)[name = tensor("denom_179_cast_fp16")]; tensor out_179_cast_fp16 = mul(x = zero_mean_179_cast_fp16, y = denom_179_cast_fp16)[name = tensor("out_179_cast_fp16")]; tensor input_295_gamma_0_to_fp16 = const()[name = tensor("input_295_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(760205440)))]; tensor input_295_beta_0_to_fp16 = const()[name = tensor("input_295_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(760208064)))]; tensor input_295_epsilon_0_to_fp16 = const()[name = tensor("input_295_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_295_cast_fp16 = batch_norm(beta = input_295_beta_0_to_fp16, epsilon = input_295_epsilon_0_to_fp16, gamma = input_295_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_179_cast_fp16)[name = tensor("input_295_cast_fp16")]; tensor var_6573 = const()[name = tensor("op_6573"), val = tensor([1, 1])]; tensor var_6575 = const()[name = tensor("op_6575"), val = tensor([1, 1])]; tensor input_297_pad_type_0 = const()[name = tensor("input_297_pad_type_0"), val = tensor("custom")]; tensor input_297_pad_0 = const()[name = tensor("input_297_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(760210688))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765125952))), name = tensor("layers_29_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_29_fc1_bias_to_fp16 = const()[name = tensor("layers_29_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765126144)))]; tensor input_297_cast_fp16 = conv(bias = layers_29_fc1_bias_to_fp16, dilations = var_6575, groups = var_6389, pad = input_297_pad_0, pad_type = input_297_pad_type_0, strides = var_6573, weight = layers_29_fc1_weight_to_fp16_palettized, x = input_295_cast_fp16)[name = tensor("input_297_cast_fp16")]; tensor input_299_mode_0 = const()[name = tensor("input_299_mode_0"), val = tensor("EXACT")]; tensor input_299_cast_fp16 = gelu(mode = input_299_mode_0, x = input_297_cast_fp16)[name = tensor("input_299_cast_fp16")]; tensor var_6581 = const()[name = tensor("op_6581"), val = tensor([1, 1])]; tensor var_6583 = const()[name = tensor("op_6583"), val = tensor([1, 1])]; tensor hidden_states_61_pad_type_0 = const()[name = tensor("hidden_states_61_pad_type_0"), val = tensor("custom")]; tensor hidden_states_61_pad_0 = const()[name = tensor("hidden_states_61_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_29_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765136448))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(771690112))), name = tensor("layers_29_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_29_fc2_bias_to_fp16 = const()[name = tensor("layers_29_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(771690688)))]; tensor hidden_states_61_cast_fp16 = conv(bias = layers_29_fc2_bias_to_fp16, dilations = var_6583, groups = var_6389, pad = hidden_states_61_pad_0, pad_type = hidden_states_61_pad_type_0, strides = var_6581, weight = layers_29_fc2_weight_to_fp16_palettized, x = input_299_cast_fp16)[name = tensor("hidden_states_61_cast_fp16")]; tensor inputs_181_cast_fp16 = add(x = inputs_179_cast_fp16, y = hidden_states_61_cast_fp16)[name = tensor("inputs_181_cast_fp16")]; tensor var_6596 = const()[name = tensor("op_6596"), val = tensor(3)]; tensor var_6603 = const()[name = tensor("op_6603"), val = tensor(1)]; tensor var_6604 = const()[name = tensor("op_6604"), val = tensor(true)]; tensor var_6616 = const()[name = tensor("op_6616"), val = tensor([1])]; tensor channels_mean_181_cast_fp16 = reduce_mean(axes = var_6616, keep_dims = var_6604, x = inputs_181_cast_fp16)[name = tensor("channels_mean_181_cast_fp16")]; tensor zero_mean_181_cast_fp16 = sub(x = inputs_181_cast_fp16, y = channels_mean_181_cast_fp16)[name = tensor("zero_mean_181_cast_fp16")]; tensor zero_mean_sq_181_cast_fp16 = mul(x = zero_mean_181_cast_fp16, y = zero_mean_181_cast_fp16)[name = tensor("zero_mean_sq_181_cast_fp16")]; tensor var_6620 = const()[name = tensor("op_6620"), val = tensor([1])]; tensor var_6621_cast_fp16 = reduce_mean(axes = var_6620, keep_dims = var_6604, x = zero_mean_sq_181_cast_fp16)[name = tensor("op_6621_cast_fp16")]; tensor var_6622_to_fp16 = const()[name = tensor("op_6622_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6623_cast_fp16 = add(x = var_6621_cast_fp16, y = var_6622_to_fp16)[name = tensor("op_6623_cast_fp16")]; tensor denom_181_epsilon_0 = const()[name = tensor("denom_181_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_181_cast_fp16 = rsqrt(epsilon = denom_181_epsilon_0, x = var_6623_cast_fp16)[name = tensor("denom_181_cast_fp16")]; tensor out_181_cast_fp16 = mul(x = zero_mean_181_cast_fp16, y = denom_181_cast_fp16)[name = tensor("out_181_cast_fp16")]; tensor obj_361_gamma_0_to_fp16 = const()[name = tensor("obj_361_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(771693312)))]; tensor obj_361_beta_0_to_fp16 = const()[name = tensor("obj_361_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(771695936)))]; tensor obj_361_epsilon_0_to_fp16 = const()[name = tensor("obj_361_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_361_cast_fp16 = batch_norm(beta = obj_361_beta_0_to_fp16, epsilon = obj_361_epsilon_0_to_fp16, gamma = obj_361_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_181_cast_fp16)[name = tensor("obj_361_cast_fp16")]; tensor var_6638 = const()[name = tensor("op_6638"), val = tensor([1, 1])]; tensor var_6640 = const()[name = tensor("op_6640"), val = tensor([1, 1])]; tensor query_121_pad_type_0 = const()[name = tensor("query_121_pad_type_0"), val = tensor("custom")]; tensor query_121_pad_0 = const()[name = tensor("query_121_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(771698560))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(772517824))), name = tensor("layers_30_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_30_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_30_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(772517952)))]; tensor query_121_cast_fp16 = conv(bias = layers_30_self_attn_q_proj_bias_to_fp16, dilations = var_6640, groups = var_6603, pad = query_121_pad_0, pad_type = query_121_pad_type_0, strides = var_6638, weight = layers_30_self_attn_q_proj_weight_to_fp16_palettized, x = obj_361_cast_fp16)[name = tensor("query_121_cast_fp16")]; tensor var_6644 = const()[name = tensor("op_6644"), val = tensor([1, 1])]; tensor var_6646 = const()[name = tensor("op_6646"), val = tensor([1, 1])]; tensor current_key_61_pad_type_0 = const()[name = tensor("current_key_61_pad_type_0"), val = tensor("custom")]; tensor current_key_61_pad_0 = const()[name = tensor("current_key_61_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(772520576))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(773339840))), name = tensor("layers_30_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_61_cast_fp16 = conv(dilations = var_6646, groups = var_6603, pad = current_key_61_pad_0, pad_type = current_key_61_pad_type_0, strides = var_6644, weight = layers_30_self_attn_k_proj_weight_to_fp16_palettized, x = obj_361_cast_fp16)[name = tensor("current_key_61_cast_fp16")]; tensor var_6651 = const()[name = tensor("op_6651"), val = tensor([1, 1])]; tensor var_6653 = const()[name = tensor("op_6653"), val = tensor([1, 1])]; tensor current_value_61_pad_type_0 = const()[name = tensor("current_value_61_pad_type_0"), val = tensor("custom")]; tensor current_value_61_pad_0 = const()[name = tensor("current_value_61_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(773339968))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(774159232))), name = tensor("layers_30_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_30_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_30_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(774159360)))]; tensor current_value_61_cast_fp16 = conv(bias = layers_30_self_attn_v_proj_bias_to_fp16, dilations = var_6653, groups = var_6603, pad = current_value_61_pad_0, pad_type = current_value_61_pad_type_0, strides = var_6651, weight = layers_30_self_attn_v_proj_weight_to_fp16_palettized, x = obj_361_cast_fp16)[name = tensor("current_value_61_cast_fp16")]; tensor var_6660_cast_fp16 = mul(x = current_key_61_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6660_cast_fp16")]; tensor var_6662_cast_fp16 = mul(x = var_103_cast_fp16_30, y = var_241_cast_fp16)[name = tensor("op_6662_cast_fp16")]; tensor key_121_cast_fp16 = add(x = var_6660_cast_fp16, y = var_6662_cast_fp16)[name = tensor("key_121_cast_fp16")]; tensor var_6664_cast_fp16 = mul(x = current_value_61_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6664_cast_fp16")]; tensor var_6666_cast_fp16 = mul(x = var_138_cast_fp16_30, y = var_241_cast_fp16)[name = tensor("op_6666_cast_fp16")]; tensor value_121_cast_fp16 = add(x = var_6664_cast_fp16, y = var_6666_cast_fp16)[name = tensor("value_121_cast_fp16")]; tensor var_6669 = const()[name = tensor("op_6669"), val = tensor([1, 20, 64, -1])]; tensor var_6670_cast_fp16 = reshape(shape = var_6669, x = query_121_cast_fp16)[name = tensor("op_6670_cast_fp16")]; tensor var_6671_to_fp16 = const()[name = tensor("op_6671_to_fp16"), val = tensor(0x1p-3)]; tensor var_6672_cast_fp16 = mul(x = var_6670_cast_fp16, y = var_6671_to_fp16)[name = tensor("op_6672_cast_fp16")]; tensor var_6673 = const()[name = tensor("op_6673"), val = tensor([1, 20, 64, -1])]; tensor var_6674_cast_fp16 = reshape(shape = var_6673, x = key_121_cast_fp16)[name = tensor("op_6674_cast_fp16")]; tensor mh_w_181_transpose_x_0 = const()[name = tensor("mh_w_181_transpose_x_0"), val = tensor(true)]; tensor mh_w_181_transpose_y_0 = const()[name = tensor("mh_w_181_transpose_y_0"), val = tensor(false)]; tensor mh_w_181_cast_fp16 = matmul(transpose_x = mh_w_181_transpose_x_0, transpose_y = mh_w_181_transpose_y_0, x = var_6672_cast_fp16, y = var_6674_cast_fp16)[name = tensor("mh_w_181_cast_fp16")]; tensor mh_w_183_cast_fp16 = add(x = mh_w_181_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_183_cast_fp16")]; tensor var_6682_cast_fp16 = softmax(axis = var_6596, x = mh_w_183_cast_fp16)[name = tensor("op_6682_cast_fp16")]; tensor var_6683 = const()[name = tensor("op_6683"), val = tensor([1, 20, 64, -1])]; tensor var_6684_cast_fp16 = reshape(shape = var_6683, x = value_121_cast_fp16)[name = tensor("op_6684_cast_fp16")]; tensor attn_121_transpose_x_0 = const()[name = tensor("attn_121_transpose_x_0"), val = tensor(false)]; tensor attn_121_transpose_y_0 = const()[name = tensor("attn_121_transpose_y_0"), val = tensor(true)]; tensor attn_121_cast_fp16 = matmul(transpose_x = attn_121_transpose_x_0, transpose_y = attn_121_transpose_y_0, x = var_6684_cast_fp16, y = var_6682_cast_fp16)[name = tensor("attn_121_cast_fp16")]; tensor var_6687 = const()[name = tensor("op_6687"), val = tensor([1, 1280, 1, -1])]; tensor input_301_cast_fp16 = reshape(shape = var_6687, x = attn_121_cast_fp16)[name = tensor("input_301_cast_fp16")]; tensor var_6691 = const()[name = tensor("op_6691"), val = tensor([1, 1])]; tensor var_6693 = const()[name = tensor("op_6693"), val = tensor([1, 1])]; tensor obj_367_pad_type_0 = const()[name = tensor("obj_367_pad_type_0"), val = tensor("custom")]; tensor obj_367_pad_0 = const()[name = tensor("obj_367_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(774161984))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(774981248))), name = tensor("layers_30_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_30_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_30_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(774981376)))]; tensor obj_367_cast_fp16 = conv(bias = layers_30_self_attn_o_proj_bias_to_fp16, dilations = var_6693, groups = var_6603, pad = obj_367_pad_0, pad_type = obj_367_pad_type_0, strides = var_6691, weight = layers_30_self_attn_o_proj_weight_to_fp16_palettized, x = input_301_cast_fp16)[name = tensor("obj_367_cast_fp16")]; tensor inputs_183_cast_fp16 = add(x = inputs_181_cast_fp16, y = obj_367_cast_fp16)[name = tensor("inputs_183_cast_fp16")]; tensor var_6703 = const()[name = tensor("op_6703"), val = tensor([1])]; tensor channels_mean_183_cast_fp16 = reduce_mean(axes = var_6703, keep_dims = var_6604, x = inputs_183_cast_fp16)[name = tensor("channels_mean_183_cast_fp16")]; tensor zero_mean_183_cast_fp16 = sub(x = inputs_183_cast_fp16, y = channels_mean_183_cast_fp16)[name = tensor("zero_mean_183_cast_fp16")]; tensor zero_mean_sq_183_cast_fp16 = mul(x = zero_mean_183_cast_fp16, y = zero_mean_183_cast_fp16)[name = tensor("zero_mean_sq_183_cast_fp16")]; tensor var_6707 = const()[name = tensor("op_6707"), val = tensor([1])]; tensor var_6708_cast_fp16 = reduce_mean(axes = var_6707, keep_dims = var_6604, x = zero_mean_sq_183_cast_fp16)[name = tensor("op_6708_cast_fp16")]; tensor var_6709_to_fp16 = const()[name = tensor("op_6709_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6710_cast_fp16 = add(x = var_6708_cast_fp16, y = var_6709_to_fp16)[name = tensor("op_6710_cast_fp16")]; tensor denom_183_epsilon_0 = const()[name = tensor("denom_183_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_183_cast_fp16 = rsqrt(epsilon = denom_183_epsilon_0, x = var_6710_cast_fp16)[name = tensor("denom_183_cast_fp16")]; tensor out_183_cast_fp16 = mul(x = zero_mean_183_cast_fp16, y = denom_183_cast_fp16)[name = tensor("out_183_cast_fp16")]; tensor obj_369_gamma_0_to_fp16 = const()[name = tensor("obj_369_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(774984000)))]; tensor obj_369_beta_0_to_fp16 = const()[name = tensor("obj_369_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(774986624)))]; tensor obj_369_epsilon_0_to_fp16 = const()[name = tensor("obj_369_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_369_cast_fp16 = batch_norm(beta = obj_369_beta_0_to_fp16, epsilon = obj_369_epsilon_0_to_fp16, gamma = obj_369_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_183_cast_fp16)[name = tensor("obj_369_cast_fp16")]; tensor var_6725 = const()[name = tensor("op_6725"), val = tensor([1, 1])]; tensor var_6727 = const()[name = tensor("op_6727"), val = tensor([1, 1])]; tensor query_123_pad_type_0 = const()[name = tensor("query_123_pad_type_0"), val = tensor("custom")]; tensor query_123_pad_0 = const()[name = tensor("query_123_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_encoder_attn_q_proj_weight_to_fp16 = const()[name = tensor("layers_30_encoder_attn_q_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(774989248)))]; tensor layers_30_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_30_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(778266112)))]; tensor query_123_cast_fp16 = conv(bias = layers_30_encoder_attn_q_proj_bias_to_fp16, dilations = var_6727, groups = var_6603, pad = query_123_pad_0, pad_type = query_123_pad_type_0, strides = var_6725, weight = layers_30_encoder_attn_q_proj_weight_to_fp16, x = obj_369_cast_fp16)[name = tensor("query_123_cast_fp16")]; tensor var_6731 = const()[name = tensor("op_6731"), val = tensor([1, 1])]; tensor var_6733 = const()[name = tensor("op_6733"), val = tensor([1, 1])]; tensor key_123_pad_type_0 = const()[name = tensor("key_123_pad_type_0"), val = tensor("custom")]; tensor key_123_pad_0 = const()[name = tensor("key_123_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(778268736))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(779497600))), name = tensor("layers_30_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_123_cast_fp16 = conv(dilations = var_6733, groups = var_6603, pad = key_123_pad_0, pad_type = key_123_pad_type_0, strides = var_6731, weight = layers_30_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_123_cast_fp16")]; tensor var_6738 = const()[name = tensor("op_6738"), val = tensor([1, 1])]; tensor var_6740 = const()[name = tensor("op_6740"), val = tensor([1, 1])]; tensor value_123_pad_type_0 = const()[name = tensor("value_123_pad_type_0"), val = tensor("custom")]; tensor value_123_pad_0 = const()[name = tensor("value_123_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(779497792))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(780726656))), name = tensor("layers_30_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_30_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_30_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(780726848)))]; tensor value_123_cast_fp16 = conv(bias = layers_30_encoder_attn_v_proj_bias_to_fp16, dilations = var_6740, groups = var_6603, pad = value_123_pad_0, pad_type = value_123_pad_type_0, strides = var_6738, weight = layers_30_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_123_cast_fp16")]; tensor var_6744 = const()[name = tensor("op_6744"), val = tensor([1, 20, 64, -1])]; tensor var_6745_cast_fp16 = reshape(shape = var_6744, x = query_123_cast_fp16)[name = tensor("op_6745_cast_fp16")]; tensor var_6746_to_fp16 = const()[name = tensor("op_6746_to_fp16"), val = tensor(0x1p-3)]; tensor var_6747_cast_fp16 = mul(x = var_6745_cast_fp16, y = var_6746_to_fp16)[name = tensor("op_6747_cast_fp16")]; tensor var_6748 = const()[name = tensor("op_6748"), val = tensor([1, 20, 64, -1])]; tensor var_6749_cast_fp16 = reshape(shape = var_6748, x = key_123_cast_fp16)[name = tensor("op_6749_cast_fp16")]; tensor mh_w_185_transpose_x_0 = const()[name = tensor("mh_w_185_transpose_x_0"), val = tensor(true)]; tensor mh_w_185_transpose_y_0 = const()[name = tensor("mh_w_185_transpose_y_0"), val = tensor(false)]; tensor mh_w_185_cast_fp16 = matmul(transpose_x = mh_w_185_transpose_x_0, transpose_y = mh_w_185_transpose_y_0, x = var_6747_cast_fp16, y = var_6749_cast_fp16)[name = tensor("mh_w_185_cast_fp16")]; tensor var_6752_cast_fp16 = softmax(axis = var_6596, x = mh_w_185_cast_fp16)[name = tensor("op_6752_cast_fp16")]; tensor var_6753 = const()[name = tensor("op_6753"), val = tensor([1, 20, 64, -1])]; tensor var_6754_cast_fp16 = reshape(shape = var_6753, x = value_123_cast_fp16)[name = tensor("op_6754_cast_fp16")]; tensor attn_123_transpose_x_0 = const()[name = tensor("attn_123_transpose_x_0"), val = tensor(false)]; tensor attn_123_transpose_y_0 = const()[name = tensor("attn_123_transpose_y_0"), val = tensor(true)]; tensor attn_123_cast_fp16 = matmul(transpose_x = attn_123_transpose_x_0, transpose_y = attn_123_transpose_y_0, x = var_6754_cast_fp16, y = var_6752_cast_fp16)[name = tensor("attn_123_cast_fp16")]; tensor var_6757 = const()[name = tensor("op_6757"), val = tensor([1, 1280, 1, -1])]; tensor input_303_cast_fp16 = reshape(shape = var_6757, x = attn_123_cast_fp16)[name = tensor("input_303_cast_fp16")]; tensor var_6761 = const()[name = tensor("op_6761"), val = tensor([1, 1])]; tensor var_6763 = const()[name = tensor("op_6763"), val = tensor([1, 1])]; tensor obj_371_pad_type_0 = const()[name = tensor("obj_371_pad_type_0"), val = tensor("custom")]; tensor obj_371_pad_0 = const()[name = tensor("obj_371_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(780729472))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(781958336))), name = tensor("layers_30_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_30_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_30_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(781958528)))]; tensor obj_371_cast_fp16 = conv(bias = layers_30_encoder_attn_o_proj_bias_to_fp16, dilations = var_6763, groups = var_6603, pad = obj_371_pad_0, pad_type = obj_371_pad_type_0, strides = var_6761, weight = layers_30_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_303_cast_fp16)[name = tensor("obj_371_cast_fp16")]; tensor inputs_185_cast_fp16 = add(x = inputs_183_cast_fp16, y = obj_371_cast_fp16)[name = tensor("inputs_185_cast_fp16")]; tensor var_6769 = const()[name = tensor("op_6769"), val = tensor([1])]; tensor channels_mean_185_cast_fp16 = reduce_mean(axes = var_6769, keep_dims = var_6604, x = inputs_185_cast_fp16)[name = tensor("channels_mean_185_cast_fp16")]; tensor zero_mean_185_cast_fp16 = sub(x = inputs_185_cast_fp16, y = channels_mean_185_cast_fp16)[name = tensor("zero_mean_185_cast_fp16")]; tensor zero_mean_sq_185_cast_fp16 = mul(x = zero_mean_185_cast_fp16, y = zero_mean_185_cast_fp16)[name = tensor("zero_mean_sq_185_cast_fp16")]; tensor var_6773 = const()[name = tensor("op_6773"), val = tensor([1])]; tensor var_6774_cast_fp16 = reduce_mean(axes = var_6773, keep_dims = var_6604, x = zero_mean_sq_185_cast_fp16)[name = tensor("op_6774_cast_fp16")]; tensor var_6775_to_fp16 = const()[name = tensor("op_6775_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6776_cast_fp16 = add(x = var_6774_cast_fp16, y = var_6775_to_fp16)[name = tensor("op_6776_cast_fp16")]; tensor denom_185_epsilon_0 = const()[name = tensor("denom_185_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_185_cast_fp16 = rsqrt(epsilon = denom_185_epsilon_0, x = var_6776_cast_fp16)[name = tensor("denom_185_cast_fp16")]; tensor out_185_cast_fp16 = mul(x = zero_mean_185_cast_fp16, y = denom_185_cast_fp16)[name = tensor("out_185_cast_fp16")]; tensor input_305_gamma_0_to_fp16 = const()[name = tensor("input_305_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(781961152)))]; tensor input_305_beta_0_to_fp16 = const()[name = tensor("input_305_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(781963776)))]; tensor input_305_epsilon_0_to_fp16 = const()[name = tensor("input_305_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_305_cast_fp16 = batch_norm(beta = input_305_beta_0_to_fp16, epsilon = input_305_epsilon_0_to_fp16, gamma = input_305_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_185_cast_fp16)[name = tensor("input_305_cast_fp16")]; tensor var_6787 = const()[name = tensor("op_6787"), val = tensor([1, 1])]; tensor var_6789 = const()[name = tensor("op_6789"), val = tensor([1, 1])]; tensor input_307_pad_type_0 = const()[name = tensor("input_307_pad_type_0"), val = tensor("custom")]; tensor input_307_pad_0 = const()[name = tensor("input_307_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(781966400))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(786881664))), name = tensor("layers_30_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_30_fc1_bias_to_fp16 = const()[name = tensor("layers_30_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(786881856)))]; tensor input_307_cast_fp16 = conv(bias = layers_30_fc1_bias_to_fp16, dilations = var_6789, groups = var_6603, pad = input_307_pad_0, pad_type = input_307_pad_type_0, strides = var_6787, weight = layers_30_fc1_weight_to_fp16_palettized, x = input_305_cast_fp16)[name = tensor("input_307_cast_fp16")]; tensor input_309_mode_0 = const()[name = tensor("input_309_mode_0"), val = tensor("EXACT")]; tensor input_309_cast_fp16 = gelu(mode = input_309_mode_0, x = input_307_cast_fp16)[name = tensor("input_309_cast_fp16")]; tensor var_6795 = const()[name = tensor("op_6795"), val = tensor([1, 1])]; tensor var_6797 = const()[name = tensor("op_6797"), val = tensor([1, 1])]; tensor hidden_states_63_pad_type_0 = const()[name = tensor("hidden_states_63_pad_type_0"), val = tensor("custom")]; tensor hidden_states_63_pad_0 = const()[name = tensor("hidden_states_63_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_30_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(786892160))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(791807424))), name = tensor("layers_30_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_30_fc2_bias_to_fp16 = const()[name = tensor("layers_30_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(791807616)))]; tensor hidden_states_63_cast_fp16 = conv(bias = layers_30_fc2_bias_to_fp16, dilations = var_6797, groups = var_6603, pad = hidden_states_63_pad_0, pad_type = hidden_states_63_pad_type_0, strides = var_6795, weight = layers_30_fc2_weight_to_fp16_palettized, x = input_309_cast_fp16)[name = tensor("hidden_states_63_cast_fp16")]; tensor inputs_187_cast_fp16 = add(x = inputs_185_cast_fp16, y = hidden_states_63_cast_fp16)[name = tensor("inputs_187_cast_fp16")]; tensor var_6810 = const()[name = tensor("op_6810"), val = tensor(3)]; tensor var_6817 = const()[name = tensor("op_6817"), val = tensor(1)]; tensor var_6818 = const()[name = tensor("op_6818"), val = tensor(true)]; tensor var_6830 = const()[name = tensor("op_6830"), val = tensor([1])]; tensor channels_mean_187_cast_fp16 = reduce_mean(axes = var_6830, keep_dims = var_6818, x = inputs_187_cast_fp16)[name = tensor("channels_mean_187_cast_fp16")]; tensor zero_mean_187_cast_fp16 = sub(x = inputs_187_cast_fp16, y = channels_mean_187_cast_fp16)[name = tensor("zero_mean_187_cast_fp16")]; tensor zero_mean_sq_187_cast_fp16 = mul(x = zero_mean_187_cast_fp16, y = zero_mean_187_cast_fp16)[name = tensor("zero_mean_sq_187_cast_fp16")]; tensor var_6834 = const()[name = tensor("op_6834"), val = tensor([1])]; tensor var_6835_cast_fp16 = reduce_mean(axes = var_6834, keep_dims = var_6818, x = zero_mean_sq_187_cast_fp16)[name = tensor("op_6835_cast_fp16")]; tensor var_6836_to_fp16 = const()[name = tensor("op_6836_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6837_cast_fp16 = add(x = var_6835_cast_fp16, y = var_6836_to_fp16)[name = tensor("op_6837_cast_fp16")]; tensor denom_187_epsilon_0 = const()[name = tensor("denom_187_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_187_cast_fp16 = rsqrt(epsilon = denom_187_epsilon_0, x = var_6837_cast_fp16)[name = tensor("denom_187_cast_fp16")]; tensor out_187_cast_fp16 = mul(x = zero_mean_187_cast_fp16, y = denom_187_cast_fp16)[name = tensor("out_187_cast_fp16")]; tensor obj_373_gamma_0_to_fp16 = const()[name = tensor("obj_373_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(791810240)))]; tensor obj_373_beta_0_to_fp16 = const()[name = tensor("obj_373_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(791812864)))]; tensor obj_373_epsilon_0_to_fp16 = const()[name = tensor("obj_373_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_373_cast_fp16 = batch_norm(beta = obj_373_beta_0_to_fp16, epsilon = obj_373_epsilon_0_to_fp16, gamma = obj_373_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_187_cast_fp16)[name = tensor("obj_373_cast_fp16")]; tensor var_6852 = const()[name = tensor("op_6852"), val = tensor([1, 1])]; tensor var_6854 = const()[name = tensor("op_6854"), val = tensor([1, 1])]; tensor query_125_pad_type_0 = const()[name = tensor("query_125_pad_type_0"), val = tensor("custom")]; tensor query_125_pad_0 = const()[name = tensor("query_125_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_self_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(791815488))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(792634752))), name = tensor("layers_31_self_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_31_self_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_31_self_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(792634880)))]; tensor query_125_cast_fp16 = conv(bias = layers_31_self_attn_q_proj_bias_to_fp16, dilations = var_6854, groups = var_6817, pad = query_125_pad_0, pad_type = query_125_pad_type_0, strides = var_6852, weight = layers_31_self_attn_q_proj_weight_to_fp16_palettized, x = obj_373_cast_fp16)[name = tensor("query_125_cast_fp16")]; tensor var_6858 = const()[name = tensor("op_6858"), val = tensor([1, 1])]; tensor var_6860 = const()[name = tensor("op_6860"), val = tensor([1, 1])]; tensor current_key_pad_type_0 = const()[name = tensor("current_key_pad_type_0"), val = tensor("custom")]; tensor current_key_pad_0 = const()[name = tensor("current_key_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_self_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(792637504))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(793456768))), name = tensor("layers_31_self_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor current_key_cast_fp16 = conv(dilations = var_6860, groups = var_6817, pad = current_key_pad_0, pad_type = current_key_pad_type_0, strides = var_6858, weight = layers_31_self_attn_k_proj_weight_to_fp16_palettized, x = obj_373_cast_fp16)[name = tensor("current_key_cast_fp16")]; tensor var_6865 = const()[name = tensor("op_6865"), val = tensor([1, 1])]; tensor var_6867 = const()[name = tensor("op_6867"), val = tensor([1, 1])]; tensor current_value_pad_type_0 = const()[name = tensor("current_value_pad_type_0"), val = tensor("custom")]; tensor current_value_pad_0 = const()[name = tensor("current_value_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_self_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(793456896))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(794276160))), name = tensor("layers_31_self_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_31_self_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_31_self_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(794276288)))]; tensor current_value_cast_fp16 = conv(bias = layers_31_self_attn_v_proj_bias_to_fp16, dilations = var_6867, groups = var_6817, pad = current_value_pad_0, pad_type = current_value_pad_type_0, strides = var_6865, weight = layers_31_self_attn_v_proj_weight_to_fp16_palettized, x = obj_373_cast_fp16)[name = tensor("current_value_cast_fp16")]; tensor var_6874_cast_fp16 = mul(x = current_key_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6874_cast_fp16")]; tensor var_6876_cast_fp16 = mul(x = var_103_cast_fp16_31, y = var_241_cast_fp16)[name = tensor("op_6876_cast_fp16")]; tensor key_125_cast_fp16 = add(x = var_6874_cast_fp16, y = var_6876_cast_fp16)[name = tensor("key_125_cast_fp16")]; tensor var_6878_cast_fp16 = mul(x = current_value_cast_fp16, y = var_238_cast_fp16)[name = tensor("op_6878_cast_fp16")]; tensor var_6880_cast_fp16 = mul(x = var_138_cast_fp16_31, y = var_241_cast_fp16)[name = tensor("op_6880_cast_fp16")]; tensor value_125_cast_fp16 = add(x = var_6878_cast_fp16, y = var_6880_cast_fp16)[name = tensor("value_125_cast_fp16")]; tensor var_6883 = const()[name = tensor("op_6883"), val = tensor([1, 20, 64, -1])]; tensor var_6884_cast_fp16 = reshape(shape = var_6883, x = query_125_cast_fp16)[name = tensor("op_6884_cast_fp16")]; tensor var_6885_to_fp16 = const()[name = tensor("op_6885_to_fp16"), val = tensor(0x1p-3)]; tensor var_6886_cast_fp16 = mul(x = var_6884_cast_fp16, y = var_6885_to_fp16)[name = tensor("op_6886_cast_fp16")]; tensor var_6887 = const()[name = tensor("op_6887"), val = tensor([1, 20, 64, -1])]; tensor var_6888_cast_fp16 = reshape(shape = var_6887, x = key_125_cast_fp16)[name = tensor("op_6888_cast_fp16")]; tensor mh_w_187_transpose_x_0 = const()[name = tensor("mh_w_187_transpose_x_0"), val = tensor(true)]; tensor mh_w_187_transpose_y_0 = const()[name = tensor("mh_w_187_transpose_y_0"), val = tensor(false)]; tensor mh_w_187_cast_fp16 = matmul(transpose_x = mh_w_187_transpose_x_0, transpose_y = mh_w_187_transpose_y_0, x = var_6886_cast_fp16, y = var_6888_cast_fp16)[name = tensor("mh_w_187_cast_fp16")]; tensor mh_w_189_cast_fp16 = add(x = mh_w_187_cast_fp16, y = var_259_cast_fp16)[name = tensor("mh_w_189_cast_fp16")]; tensor var_6896_cast_fp16 = softmax(axis = var_6810, x = mh_w_189_cast_fp16)[name = tensor("op_6896_cast_fp16")]; tensor var_6897 = const()[name = tensor("op_6897"), val = tensor([1, 20, 64, -1])]; tensor var_6898_cast_fp16 = reshape(shape = var_6897, x = value_125_cast_fp16)[name = tensor("op_6898_cast_fp16")]; tensor attn_125_transpose_x_0 = const()[name = tensor("attn_125_transpose_x_0"), val = tensor(false)]; tensor attn_125_transpose_y_0 = const()[name = tensor("attn_125_transpose_y_0"), val = tensor(true)]; tensor attn_125_cast_fp16 = matmul(transpose_x = attn_125_transpose_x_0, transpose_y = attn_125_transpose_y_0, x = var_6898_cast_fp16, y = var_6896_cast_fp16)[name = tensor("attn_125_cast_fp16")]; tensor var_6901 = const()[name = tensor("op_6901"), val = tensor([1, 1280, 1, -1])]; tensor input_311_cast_fp16 = reshape(shape = var_6901, x = attn_125_cast_fp16)[name = tensor("input_311_cast_fp16")]; tensor var_6905 = const()[name = tensor("op_6905"), val = tensor([1, 1])]; tensor var_6907 = const()[name = tensor("op_6907"), val = tensor([1, 1])]; tensor obj_379_pad_type_0 = const()[name = tensor("obj_379_pad_type_0"), val = tensor("custom")]; tensor obj_379_pad_0 = const()[name = tensor("obj_379_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_self_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(794278912))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795098176))), name = tensor("layers_31_self_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_31_self_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_31_self_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795098304)))]; tensor obj_379_cast_fp16 = conv(bias = layers_31_self_attn_o_proj_bias_to_fp16, dilations = var_6907, groups = var_6817, pad = obj_379_pad_0, pad_type = obj_379_pad_type_0, strides = var_6905, weight = layers_31_self_attn_o_proj_weight_to_fp16_palettized, x = input_311_cast_fp16)[name = tensor("obj_379_cast_fp16")]; tensor inputs_189_cast_fp16 = add(x = inputs_187_cast_fp16, y = obj_379_cast_fp16)[name = tensor("inputs_189_cast_fp16")]; tensor var_6917 = const()[name = tensor("op_6917"), val = tensor([1])]; tensor channels_mean_189_cast_fp16 = reduce_mean(axes = var_6917, keep_dims = var_6818, x = inputs_189_cast_fp16)[name = tensor("channels_mean_189_cast_fp16")]; tensor zero_mean_189_cast_fp16 = sub(x = inputs_189_cast_fp16, y = channels_mean_189_cast_fp16)[name = tensor("zero_mean_189_cast_fp16")]; tensor zero_mean_sq_189_cast_fp16 = mul(x = zero_mean_189_cast_fp16, y = zero_mean_189_cast_fp16)[name = tensor("zero_mean_sq_189_cast_fp16")]; tensor var_6921 = const()[name = tensor("op_6921"), val = tensor([1])]; tensor var_6922_cast_fp16 = reduce_mean(axes = var_6921, keep_dims = var_6818, x = zero_mean_sq_189_cast_fp16)[name = tensor("op_6922_cast_fp16")]; tensor var_6923_to_fp16 = const()[name = tensor("op_6923_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6924_cast_fp16 = add(x = var_6922_cast_fp16, y = var_6923_to_fp16)[name = tensor("op_6924_cast_fp16")]; tensor denom_189_epsilon_0 = const()[name = tensor("denom_189_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_189_cast_fp16 = rsqrt(epsilon = denom_189_epsilon_0, x = var_6924_cast_fp16)[name = tensor("denom_189_cast_fp16")]; tensor out_189_cast_fp16 = mul(x = zero_mean_189_cast_fp16, y = denom_189_cast_fp16)[name = tensor("out_189_cast_fp16")]; tensor obj_381_gamma_0_to_fp16 = const()[name = tensor("obj_381_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795100928)))]; tensor obj_381_beta_0_to_fp16 = const()[name = tensor("obj_381_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795103552)))]; tensor obj_381_epsilon_0_to_fp16 = const()[name = tensor("obj_381_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor obj_381_cast_fp16 = batch_norm(beta = obj_381_beta_0_to_fp16, epsilon = obj_381_epsilon_0_to_fp16, gamma = obj_381_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_189_cast_fp16)[name = tensor("obj_381_cast_fp16")]; tensor var_6939 = const()[name = tensor("op_6939"), val = tensor([1, 1])]; tensor var_6941 = const()[name = tensor("op_6941"), val = tensor([1, 1])]; tensor query_pad_type_0 = const()[name = tensor("query_pad_type_0"), val = tensor("custom")]; tensor query_pad_0 = const()[name = tensor("query_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_encoder_attn_q_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795106176))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(796335040))), name = tensor("layers_31_encoder_attn_q_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_31_encoder_attn_q_proj_bias_to_fp16 = const()[name = tensor("layers_31_encoder_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(796335232)))]; tensor query_cast_fp16 = conv(bias = layers_31_encoder_attn_q_proj_bias_to_fp16, dilations = var_6941, groups = var_6817, pad = query_pad_0, pad_type = query_pad_type_0, strides = var_6939, weight = layers_31_encoder_attn_q_proj_weight_to_fp16_palettized, x = obj_381_cast_fp16)[name = tensor("query_cast_fp16")]; tensor var_6945 = const()[name = tensor("op_6945"), val = tensor([1, 1])]; tensor var_6947 = const()[name = tensor("op_6947"), val = tensor([1, 1])]; tensor key_pad_type_0 = const()[name = tensor("key_pad_type_0"), val = tensor("custom")]; tensor key_pad_0 = const()[name = tensor("key_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_encoder_attn_k_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(796337856))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(797566720))), name = tensor("layers_31_encoder_attn_k_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor key_cast_fp16 = conv(dilations = var_6947, groups = var_6817, pad = key_pad_0, pad_type = key_pad_type_0, strides = var_6945, weight = layers_31_encoder_attn_k_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("key_cast_fp16")]; tensor var_6952 = const()[name = tensor("op_6952"), val = tensor([1, 1])]; tensor var_6954 = const()[name = tensor("op_6954"), val = tensor([1, 1])]; tensor value_pad_type_0 = const()[name = tensor("value_pad_type_0"), val = tensor("custom")]; tensor value_pad_0 = const()[name = tensor("value_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_encoder_attn_v_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(797566912))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(798795776))), name = tensor("layers_31_encoder_attn_v_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_31_encoder_attn_v_proj_bias_to_fp16 = const()[name = tensor("layers_31_encoder_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(798795968)))]; tensor value_cast_fp16 = conv(bias = layers_31_encoder_attn_v_proj_bias_to_fp16, dilations = var_6954, groups = var_6817, pad = value_pad_0, pad_type = value_pad_type_0, strides = var_6952, weight = layers_31_encoder_attn_v_proj_weight_to_fp16_palettized, x = encoder_output_embeds)[name = tensor("value_cast_fp16")]; tensor var_6958 = const()[name = tensor("op_6958"), val = tensor([1, 20, 64, -1])]; tensor var_6959_cast_fp16 = reshape(shape = var_6958, x = query_cast_fp16)[name = tensor("op_6959_cast_fp16")]; tensor var_6960_to_fp16 = const()[name = tensor("op_6960_to_fp16"), val = tensor(0x1p-3)]; tensor var_6961_cast_fp16 = mul(x = var_6959_cast_fp16, y = var_6960_to_fp16)[name = tensor("op_6961_cast_fp16")]; tensor var_6962 = const()[name = tensor("op_6962"), val = tensor([1, 20, 64, -1])]; tensor var_6963_cast_fp16 = reshape(shape = var_6962, x = key_cast_fp16)[name = tensor("op_6963_cast_fp16")]; tensor mh_w_transpose_x_0 = const()[name = tensor("mh_w_transpose_x_0"), val = tensor(true)]; tensor mh_w_transpose_y_0 = const()[name = tensor("mh_w_transpose_y_0"), val = tensor(false)]; tensor mh_w_cast_fp16 = matmul(transpose_x = mh_w_transpose_x_0, transpose_y = mh_w_transpose_y_0, x = var_6961_cast_fp16, y = var_6963_cast_fp16)[name = tensor("mh_w_cast_fp16")]; tensor var_6966_cast_fp16 = softmax(axis = var_6810, x = mh_w_cast_fp16)[name = tensor("op_6966_cast_fp16")]; tensor var_6967 = const()[name = tensor("op_6967"), val = tensor([1, 20, 64, -1])]; tensor var_6968_cast_fp16 = reshape(shape = var_6967, x = value_cast_fp16)[name = tensor("op_6968_cast_fp16")]; tensor attn_transpose_x_0 = const()[name = tensor("attn_transpose_x_0"), val = tensor(false)]; tensor attn_transpose_y_0 = const()[name = tensor("attn_transpose_y_0"), val = tensor(true)]; tensor attn_cast_fp16 = matmul(transpose_x = attn_transpose_x_0, transpose_y = attn_transpose_y_0, x = var_6968_cast_fp16, y = var_6966_cast_fp16)[name = tensor("attn_cast_fp16")]; tensor var_6971 = const()[name = tensor("op_6971"), val = tensor([1, 1280, 1, -1])]; tensor input_313_cast_fp16 = reshape(shape = var_6971, x = attn_cast_fp16)[name = tensor("input_313_cast_fp16")]; tensor var_6975 = const()[name = tensor("op_6975"), val = tensor([1, 1])]; tensor var_6977 = const()[name = tensor("op_6977"), val = tensor([1, 1])]; tensor obj_383_pad_type_0 = const()[name = tensor("obj_383_pad_type_0"), val = tensor("custom")]; tensor obj_383_pad_0 = const()[name = tensor("obj_383_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_encoder_attn_o_proj_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(798798592))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(800027456))), name = tensor("layers_31_encoder_attn_o_proj_weight_to_fp16_palettized"), shape = tensor([1280, 1280, 1, 1])]; tensor layers_31_encoder_attn_o_proj_bias_to_fp16 = const()[name = tensor("layers_31_encoder_attn_o_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(800027648)))]; tensor obj_383_cast_fp16 = conv(bias = layers_31_encoder_attn_o_proj_bias_to_fp16, dilations = var_6977, groups = var_6817, pad = obj_383_pad_0, pad_type = obj_383_pad_type_0, strides = var_6975, weight = layers_31_encoder_attn_o_proj_weight_to_fp16_palettized, x = input_313_cast_fp16)[name = tensor("obj_383_cast_fp16")]; tensor inputs_191_cast_fp16 = add(x = inputs_189_cast_fp16, y = obj_383_cast_fp16)[name = tensor("inputs_191_cast_fp16")]; tensor var_6983 = const()[name = tensor("op_6983"), val = tensor([1])]; tensor channels_mean_191_cast_fp16 = reduce_mean(axes = var_6983, keep_dims = var_6818, x = inputs_191_cast_fp16)[name = tensor("channels_mean_191_cast_fp16")]; tensor zero_mean_191_cast_fp16 = sub(x = inputs_191_cast_fp16, y = channels_mean_191_cast_fp16)[name = tensor("zero_mean_191_cast_fp16")]; tensor zero_mean_sq_191_cast_fp16 = mul(x = zero_mean_191_cast_fp16, y = zero_mean_191_cast_fp16)[name = tensor("zero_mean_sq_191_cast_fp16")]; tensor var_6987 = const()[name = tensor("op_6987"), val = tensor([1])]; tensor var_6988_cast_fp16 = reduce_mean(axes = var_6987, keep_dims = var_6818, x = zero_mean_sq_191_cast_fp16)[name = tensor("op_6988_cast_fp16")]; tensor var_6989_to_fp16 = const()[name = tensor("op_6989_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_6990_cast_fp16 = add(x = var_6988_cast_fp16, y = var_6989_to_fp16)[name = tensor("op_6990_cast_fp16")]; tensor denom_191_epsilon_0 = const()[name = tensor("denom_191_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_191_cast_fp16 = rsqrt(epsilon = denom_191_epsilon_0, x = var_6990_cast_fp16)[name = tensor("denom_191_cast_fp16")]; tensor out_191_cast_fp16 = mul(x = zero_mean_191_cast_fp16, y = denom_191_cast_fp16)[name = tensor("out_191_cast_fp16")]; tensor input_315_gamma_0_to_fp16 = const()[name = tensor("input_315_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(800030272)))]; tensor input_315_beta_0_to_fp16 = const()[name = tensor("input_315_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(800032896)))]; tensor input_315_epsilon_0_to_fp16 = const()[name = tensor("input_315_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor input_315_cast_fp16 = batch_norm(beta = input_315_beta_0_to_fp16, epsilon = input_315_epsilon_0_to_fp16, gamma = input_315_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_191_cast_fp16)[name = tensor("input_315_cast_fp16")]; tensor var_7001 = const()[name = tensor("op_7001"), val = tensor([1, 1])]; tensor var_7003 = const()[name = tensor("op_7003"), val = tensor([1, 1])]; tensor input_317_pad_type_0 = const()[name = tensor("input_317_pad_type_0"), val = tensor("custom")]; tensor input_317_pad_0 = const()[name = tensor("input_317_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_fc1_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(800035520))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(804950784))), name = tensor("layers_31_fc1_weight_to_fp16_palettized"), shape = tensor([5120, 1280, 1, 1])]; tensor layers_31_fc1_bias_to_fp16 = const()[name = tensor("layers_31_fc1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(804950976)))]; tensor input_317_cast_fp16 = conv(bias = layers_31_fc1_bias_to_fp16, dilations = var_7003, groups = var_6817, pad = input_317_pad_0, pad_type = input_317_pad_type_0, strides = var_7001, weight = layers_31_fc1_weight_to_fp16_palettized, x = input_315_cast_fp16)[name = tensor("input_317_cast_fp16")]; tensor input_mode_0 = const()[name = tensor("input_mode_0"), val = tensor("EXACT")]; tensor input_cast_fp16 = gelu(mode = input_mode_0, x = input_317_cast_fp16)[name = tensor("input_cast_fp16")]; tensor var_7009 = const()[name = tensor("op_7009"), val = tensor([1, 1])]; tensor var_7011 = const()[name = tensor("op_7011"), val = tensor([1, 1])]; tensor hidden_states_65_pad_type_0 = const()[name = tensor("hidden_states_65_pad_type_0"), val = tensor("custom")]; tensor hidden_states_65_pad_0 = const()[name = tensor("hidden_states_65_pad_0"), val = tensor([0, 0, 0, 0])]; tensor layers_31_fc2_weight_to_fp16_palettized = constexpr_lut_to_dense()[indices = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(804961280))), lut = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(809876544))), name = tensor("layers_31_fc2_weight_to_fp16_palettized"), shape = tensor([1280, 5120, 1, 1])]; tensor layers_31_fc2_bias_to_fp16 = const()[name = tensor("layers_31_fc2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(809876736)))]; tensor hidden_states_65_cast_fp16 = conv(bias = layers_31_fc2_bias_to_fp16, dilations = var_7011, groups = var_6817, pad = hidden_states_65_pad_0, pad_type = hidden_states_65_pad_type_0, strides = var_7009, weight = layers_31_fc2_weight_to_fp16_palettized, x = input_cast_fp16)[name = tensor("hidden_states_65_cast_fp16")]; tensor inputs_cast_fp16 = add(x = inputs_191_cast_fp16, y = hidden_states_65_cast_fp16)[name = tensor("inputs_cast_fp16")]; tensor var_7021 = const()[name = tensor("op_7021"), val = tensor(true)]; tensor var_7025 = const()[name = tensor("op_7025"), val = tensor([1])]; tensor channels_mean_cast_fp16 = reduce_mean(axes = var_7025, keep_dims = var_7021, x = inputs_cast_fp16)[name = tensor("channels_mean_cast_fp16")]; tensor zero_mean_cast_fp16 = sub(x = inputs_cast_fp16, y = channels_mean_cast_fp16)[name = tensor("zero_mean_cast_fp16")]; tensor zero_mean_sq_cast_fp16 = mul(x = zero_mean_cast_fp16, y = zero_mean_cast_fp16)[name = tensor("zero_mean_sq_cast_fp16")]; tensor var_7029 = const()[name = tensor("op_7029"), val = tensor([1])]; tensor var_7030_cast_fp16 = reduce_mean(axes = var_7029, keep_dims = var_7021, x = zero_mean_sq_cast_fp16)[name = tensor("op_7030_cast_fp16")]; tensor var_7031_to_fp16 = const()[name = tensor("op_7031_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_7032_cast_fp16 = add(x = var_7030_cast_fp16, y = var_7031_to_fp16)[name = tensor("op_7032_cast_fp16")]; tensor denom_epsilon_0 = const()[name = tensor("denom_epsilon_0"), val = tensor(0x1.197998p-40)]; tensor denom_cast_fp16 = rsqrt(epsilon = denom_epsilon_0, x = var_7032_cast_fp16)[name = tensor("denom_cast_fp16")]; tensor out_cast_fp16 = mul(x = zero_mean_cast_fp16, y = denom_cast_fp16)[name = tensor("out_cast_fp16")]; tensor hidden_states_gamma_0_to_fp16 = const()[name = tensor("hidden_states_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(809879360)))]; tensor hidden_states_beta_0_to_fp16 = const()[name = tensor("hidden_states_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(809881984)))]; tensor hidden_states_epsilon_0_to_fp16 = const()[name = tensor("hidden_states_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor hidden_states_cast_fp16 = batch_norm(beta = hidden_states_beta_0_to_fp16, epsilon = hidden_states_epsilon_0_to_fp16, gamma = hidden_states_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_cast_fp16)[name = tensor("hidden_states_cast_fp16")]; tensor var_7042_axes_0 = const()[name = tensor("op_7042_axes_0"), val = tensor([2])]; tensor var_7042_cast_fp16 = squeeze(axes = var_7042_axes_0, x = hidden_states_cast_fp16)[name = tensor("op_7042_cast_fp16")]; tensor var_7045_perm_0 = const()[name = tensor("op_7045_perm_0"), val = tensor([0, 2, 1])]; tensor linear_0_bias_0_to_fp16 = const()[name = tensor("linear_0_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(809884608)))]; tensor transpose_0 = transpose(perm = var_7045_perm_0, x = var_7042_cast_fp16)[name = tensor("transpose_0")]; tensor logits = linear(bias = linear_0_bias_0_to_fp16, weight = embed_tokens_weight_to_fp16, x = transpose_0)[name = tensor("linear_0_cast_fp16")]; tensor var_7049 = const()[name = tensor("op_7049"), val = tensor(1)]; tensor obj_387_interleave_0 = const()[name = tensor("obj_387_interleave_0"), val = tensor(false)]; tensor key_cache_updates = concat(axis = var_7049, interleave = obj_387_interleave_0, values = (current_key_1_cast_fp16, current_key_3_cast_fp16, current_key_5_cast_fp16, current_key_7_cast_fp16, current_key_9_cast_fp16, current_key_11_cast_fp16, current_key_13_cast_fp16, current_key_15_cast_fp16, current_key_17_cast_fp16, current_key_19_cast_fp16, current_key_21_cast_fp16, current_key_23_cast_fp16, current_key_25_cast_fp16, current_key_27_cast_fp16, current_key_29_cast_fp16, current_key_31_cast_fp16, current_key_33_cast_fp16, current_key_35_cast_fp16, current_key_37_cast_fp16, current_key_39_cast_fp16, current_key_41_cast_fp16, current_key_43_cast_fp16, current_key_45_cast_fp16, current_key_47_cast_fp16, current_key_49_cast_fp16, current_key_51_cast_fp16, current_key_53_cast_fp16, current_key_55_cast_fp16, current_key_57_cast_fp16, current_key_59_cast_fp16, current_key_61_cast_fp16, current_key_cast_fp16))[name = tensor("obj_387_cast_fp16")]; tensor var_7052 = const()[name = tensor("op_7052"), val = tensor(1)]; tensor obj_interleave_0 = const()[name = tensor("obj_interleave_0"), val = tensor(false)]; tensor value_cache_updates = concat(axis = var_7052, interleave = obj_interleave_0, values = (current_value_1_cast_fp16, current_value_3_cast_fp16, current_value_5_cast_fp16, current_value_7_cast_fp16, current_value_9_cast_fp16, current_value_11_cast_fp16, current_value_13_cast_fp16, current_value_15_cast_fp16, current_value_17_cast_fp16, current_value_19_cast_fp16, current_value_21_cast_fp16, current_value_23_cast_fp16, current_value_25_cast_fp16, current_value_27_cast_fp16, current_value_29_cast_fp16, current_value_31_cast_fp16, current_value_33_cast_fp16, current_value_35_cast_fp16, current_value_37_cast_fp16, current_value_39_cast_fp16, current_value_41_cast_fp16, current_value_43_cast_fp16, current_value_45_cast_fp16, current_value_47_cast_fp16, current_value_49_cast_fp16, current_value_51_cast_fp16, current_value_53_cast_fp16, current_value_55_cast_fp16, current_value_57_cast_fp16, current_value_59_cast_fp16, current_value_61_cast_fp16, current_value_cast_fp16))[name = tensor("obj_cast_fp16")]; } -> (logits, key_cache_updates, value_cache_updates); }