program(1.3) [buildInfo = dict({{"coremlc-component-MIL", "3400.23.1"}, {"coremlc-version", "3400.24.1"}}), mldb_token = string("mldb-5qbg63zgxe")] { func main(tensor mlm_input) { int32 var_6 = const()[name = string("op_6"), val = int32(0)]; tensor var_13 = const()[name = string("op_13"), val = tensor([1, 1, 1])]; int32 var_14_axis_0 = const()[name = string("op_14_axis_0"), val = int32(-1)]; tensor var_14_0, tensor var_14_1, tensor var_14_2 = split(axis = var_14_axis_0, split_sizes = var_13, x = mlm_input)[name = string("op_14")]; tensor var_18_axes_0 = const()[name = string("op_18_axes_0"), val = tensor([-1])]; tensor var_18 = squeeze(axes = var_18_axes_0, x = var_14_0)[name = string("op_18")]; tensor tok_ids_1_axes_0 = const()[name = string("tok_ids_1_axes_0"), val = tensor([-1])]; tensor tok_ids_1 = squeeze(axes = tok_ids_1_axes_0, x = var_18)[name = string("tok_ids_1")]; tensor var_20_axes_0 = const()[name = string("op_20_axes_0"), val = tensor([-1])]; tensor var_20 = squeeze(axes = var_20_axes_0, x = var_14_1)[name = string("op_20")]; tensor var_22_axes_0 = const()[name = string("op_22_axes_0"), val = tensor([-1])]; tensor var_22 = squeeze(axes = var_22_axes_0, x = var_14_2)[name = string("op_22")]; tensor var_24 = not_equal(x = tok_ids_1, y = var_6)[name = string("op_24")]; fp16 var_8_to_fp16 = const()[name = string("op_8_to_fp16"), val = fp16(0x1p+0)]; string var_24_to_fp32_to_fp16_dtype_0 = const()[name = string("op_24_to_fp32_to_fp16_dtype_0"), val = string("fp16")]; tensor cast_1 = cast(dtype = var_24_to_fp32_to_fp16_dtype_0, x = var_24)[name = string("cast_1")]; tensor var_29_cast_fp16 = sub(x = var_8_to_fp16, y = cast_1)[name = string("op_29_cast_fp16")]; fp16 var_30_to_fp16 = const()[name = string("op_30_to_fp16"), val = fp16(-0x1.388p+13)]; tensor padding_mask0_1_cast_fp16 = mul(x = var_29_cast_fp16, y = var_30_to_fp16)[name = string("padding_mask0_1_cast_fp16")]; tensor var_32 = const()[name = string("op_32"), val = tensor([-1, 256, 1, 1])]; tensor var_33_cast_fp16 = reshape(shape = var_32, x = padding_mask0_1_cast_fp16)[name = string("op_33_cast_fp16")]; int32 var_46 = const()[name = string("op_46"), val = int32(1)]; int32 var_47 = const()[name = string("op_47"), val = int32(2)]; tensor input_6_axes_0 = const()[name = string("input_6_axes_0"), val = tensor([2])]; tensor input_6 = expand_dims(axes = input_6_axes_0, x = tok_ids_1)[name = string("input_6")]; int32 var_54_axis_0 = const()[name = string("op_54_axis_0"), val = int32(0)]; tensor nlp_net_default_encoder_tok_embed_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_tok_embed_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(64))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(17955200))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(17920128)))]; int32 op_54_cast_fp16_batch_dims_0 = const()[name = string("op_54_cast_fp16_batch_dims_0"), val = int32(0)]; tensor var_54_cast_fp16 = gather(axis = var_54_axis_0, batch_dims = op_54_cast_fp16_batch_dims_0, indices = input_6, x = nlp_net_default_encoder_tok_embed_weight_to_fp16_affine_quantized)[name = string("op_54_cast_fp16")]; int32 var_57_axis_0 = const()[name = string("op_57_axis_0"), val = int32(0)]; tensor nlp_net_default_encoder_pos_embed_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_pos_embed_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18025280))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18156736))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18156416)))]; int32 op_57_cast_fp16_batch_dims_0 = const()[name = string("op_57_cast_fp16_batch_dims_0"), val = int32(0)]; tensor var_57_cast_fp16 = gather(axis = var_57_axis_0, batch_dims = op_57_cast_fp16_batch_dims_0, indices = var_20, x = nlp_net_default_encoder_pos_embed_weight_to_fp16_affine_quantized)[name = string("op_57_cast_fp16")]; int32 var_60_axis_0 = const()[name = string("op_60_axis_0"), val = int32(0)]; tensor nlp_net_default_encoder_seg_embed_weight_to_fp16 = const()[name = string("nlp_net_default_encoder_seg_embed_weight_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18157312)))]; int32 op_60_cast_fp16_batch_dims_0 = const()[name = string("op_60_cast_fp16_batch_dims_0"), val = int32(0)]; tensor var_60_cast_fp16 = gather(axis = var_60_axis_0, batch_dims = op_60_cast_fp16_batch_dims_0, indices = var_22, x = nlp_net_default_encoder_seg_embed_weight_to_fp16)[name = string("op_60_cast_fp16")]; tensor var_62_cast_fp16 = add(x = var_54_cast_fp16, y = var_57_cast_fp16)[name = string("op_62_cast_fp16")]; tensor var_63_cast_fp16 = add(x = var_62_cast_fp16, y = var_60_cast_fp16)[name = string("op_63_cast_fp16")]; tensor t_1_perm_0 = const()[name = string("t_1_perm_0"), val = tensor([0, 3, 2, 1])]; tensor k_3_axes_0 = const()[name = string("k_3_axes_0"), val = tensor([1])]; tensor k_3_gamma_0_to_fp16 = const()[name = string("k_3_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18158400)))]; tensor k_3_beta_0_to_fp16 = const()[name = string("k_3_beta_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18159488)))]; fp16 var_94_to_fp16 = const()[name = string("op_94_to_fp16"), val = fp16(0x1.5p-17)]; tensor transpose_9 = transpose(perm = t_1_perm_0, x = var_63_cast_fp16)[name = string("transpose_9")]; tensor k_3_cast_fp16 = layer_norm(axes = k_3_axes_0, beta = k_3_beta_0_to_fp16, epsilon = var_94_to_fp16, gamma = k_3_gamma_0_to_fp16, x = transpose_9)[name = string("k_3_cast_fp16")]; tensor var_113 = const()[name = string("op_113"), val = tensor([1, 1])]; tensor var_115 = const()[name = string("op_115"), val = tensor([1, 1])]; string var_117_pad_type_0 = const()[name = string("op_117_pad_type_0"), val = string("custom")]; tensor var_117_pad_0 = const()[name = string("op_117_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_0_attn_q_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_0_attn_q_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18160576))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18423360))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18422784)))]; tensor nlp_net_default_encoder_transformer_layers_0_attn_q_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_0_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18424448)))]; tensor var_117_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_0_attn_q_proj_bias_to_fp16, dilations = var_115, groups = var_46, pad = var_117_pad_0, pad_type = var_117_pad_type_0, strides = var_113, weight = nlp_net_default_encoder_transformer_layers_0_attn_q_proj_weight_to_fp16_affine_quantized, x = k_3_cast_fp16)[name = string("op_117_cast_fp16")]; tensor var_120 = const()[name = string("op_120"), val = tensor([1, 1])]; tensor var_122 = const()[name = string("op_122"), val = tensor([1, 1])]; string k_5_pad_type_0 = const()[name = string("k_5_pad_type_0"), val = string("custom")]; tensor k_5_pad_0 = const()[name = string("k_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_0_attn_k_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_0_attn_k_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18425536))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18688320))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18687744)))]; tensor nlp_net_default_encoder_transformer_layers_0_attn_k_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_0_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18689408)))]; tensor k_5_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_0_attn_k_proj_bias_to_fp16, dilations = var_122, groups = var_46, pad = k_5_pad_0, pad_type = k_5_pad_type_0, strides = var_120, weight = nlp_net_default_encoder_transformer_layers_0_attn_k_proj_weight_to_fp16_affine_quantized, x = k_3_cast_fp16)[name = string("k_5_cast_fp16")]; tensor var_127 = const()[name = string("op_127"), val = tensor([1, 1])]; tensor var_129 = const()[name = string("op_129"), val = tensor([1, 1])]; string var_131_pad_type_0 = const()[name = string("op_131_pad_type_0"), val = string("custom")]; tensor var_131_pad_0 = const()[name = string("op_131_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_0_attn_v_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_0_attn_v_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18690496))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18953280))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18952704)))]; tensor nlp_net_default_encoder_transformer_layers_0_attn_v_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_0_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18954368)))]; tensor var_131_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_0_attn_v_proj_bias_to_fp16, dilations = var_129, groups = var_46, pad = var_131_pad_0, pad_type = var_131_pad_type_0, strides = var_127, weight = nlp_net_default_encoder_transformer_layers_0_attn_v_proj_weight_to_fp16_affine_quantized, x = k_3_cast_fp16)[name = string("op_131_cast_fp16")]; tensor tile_0 = const()[name = string("tile_0"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; int32 var_132_axis_0 = const()[name = string("op_132_axis_0"), val = int32(1)]; tensor var_132_cast_fp16_0, tensor var_132_cast_fp16_1, tensor var_132_cast_fp16_2, tensor var_132_cast_fp16_3, tensor var_132_cast_fp16_4, tensor var_132_cast_fp16_5, tensor var_132_cast_fp16_6, tensor var_132_cast_fp16_7 = split(axis = var_132_axis_0, split_sizes = tile_0, x = var_117_cast_fp16)[name = string("op_132_cast_fp16")]; tensor var_141_perm_0 = const()[name = string("op_141_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_1 = const()[name = string("tile_1"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; int32 var_142_axis_0 = const()[name = string("op_142_axis_0"), val = int32(3)]; tensor transpose_8 = transpose(perm = var_141_perm_0, x = k_5_cast_fp16)[name = string("transpose_8")]; tensor var_142_cast_fp16_0, tensor var_142_cast_fp16_1, tensor var_142_cast_fp16_2, tensor var_142_cast_fp16_3, tensor var_142_cast_fp16_4, tensor var_142_cast_fp16_5, tensor var_142_cast_fp16_6, tensor var_142_cast_fp16_7 = split(axis = var_142_axis_0, split_sizes = tile_1, x = transpose_8)[name = string("op_142_cast_fp16")]; tensor tile_2 = const()[name = string("tile_2"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; int32 var_151_axis_0 = const()[name = string("op_151_axis_0"), val = int32(1)]; tensor var_151_cast_fp16_0, tensor var_151_cast_fp16_1, tensor var_151_cast_fp16_2, tensor var_151_cast_fp16_3, tensor var_151_cast_fp16_4, tensor var_151_cast_fp16_5, tensor var_151_cast_fp16_6, tensor var_151_cast_fp16_7 = split(axis = var_151_axis_0, split_sizes = tile_2, x = var_131_cast_fp16)[name = string("op_151_cast_fp16")]; string var_161_equation_0 = const()[name = string("op_161_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_161_cast_fp16 = einsum(equation = var_161_equation_0, values = (var_142_cast_fp16_0, var_132_cast_fp16_0))[name = string("op_161_cast_fp16")]; fp16 var_162_to_fp16 = const()[name = string("op_162_to_fp16"), val = fp16(0x1p-3)]; tensor var_163_cast_fp16 = mul(x = var_161_cast_fp16, y = var_162_to_fp16)[name = string("op_163_cast_fp16")]; string var_165_equation_0 = const()[name = string("op_165_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_165_cast_fp16 = einsum(equation = var_165_equation_0, values = (var_142_cast_fp16_1, var_132_cast_fp16_1))[name = string("op_165_cast_fp16")]; fp16 var_166_to_fp16 = const()[name = string("op_166_to_fp16"), val = fp16(0x1p-3)]; tensor var_167_cast_fp16 = mul(x = var_165_cast_fp16, y = var_166_to_fp16)[name = string("op_167_cast_fp16")]; string var_169_equation_0 = const()[name = string("op_169_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_169_cast_fp16 = einsum(equation = var_169_equation_0, values = (var_142_cast_fp16_2, var_132_cast_fp16_2))[name = string("op_169_cast_fp16")]; fp16 var_170_to_fp16 = const()[name = string("op_170_to_fp16"), val = fp16(0x1p-3)]; tensor var_171_cast_fp16 = mul(x = var_169_cast_fp16, y = var_170_to_fp16)[name = string("op_171_cast_fp16")]; string var_173_equation_0 = const()[name = string("op_173_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_173_cast_fp16 = einsum(equation = var_173_equation_0, values = (var_142_cast_fp16_3, var_132_cast_fp16_3))[name = string("op_173_cast_fp16")]; fp16 var_174_to_fp16 = const()[name = string("op_174_to_fp16"), val = fp16(0x1p-3)]; tensor var_175_cast_fp16 = mul(x = var_173_cast_fp16, y = var_174_to_fp16)[name = string("op_175_cast_fp16")]; string var_177_equation_0 = const()[name = string("op_177_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_177_cast_fp16 = einsum(equation = var_177_equation_0, values = (var_142_cast_fp16_4, var_132_cast_fp16_4))[name = string("op_177_cast_fp16")]; fp16 var_178_to_fp16 = const()[name = string("op_178_to_fp16"), val = fp16(0x1p-3)]; tensor var_179_cast_fp16 = mul(x = var_177_cast_fp16, y = var_178_to_fp16)[name = string("op_179_cast_fp16")]; string var_181_equation_0 = const()[name = string("op_181_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_181_cast_fp16 = einsum(equation = var_181_equation_0, values = (var_142_cast_fp16_5, var_132_cast_fp16_5))[name = string("op_181_cast_fp16")]; fp16 var_182_to_fp16 = const()[name = string("op_182_to_fp16"), val = fp16(0x1p-3)]; tensor var_183_cast_fp16 = mul(x = var_181_cast_fp16, y = var_182_to_fp16)[name = string("op_183_cast_fp16")]; string var_185_equation_0 = const()[name = string("op_185_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_185_cast_fp16 = einsum(equation = var_185_equation_0, values = (var_142_cast_fp16_6, var_132_cast_fp16_6))[name = string("op_185_cast_fp16")]; fp16 var_186_to_fp16 = const()[name = string("op_186_to_fp16"), val = fp16(0x1p-3)]; tensor var_187_cast_fp16 = mul(x = var_185_cast_fp16, y = var_186_to_fp16)[name = string("op_187_cast_fp16")]; string var_189_equation_0 = const()[name = string("op_189_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_189_cast_fp16 = einsum(equation = var_189_equation_0, values = (var_142_cast_fp16_7, var_132_cast_fp16_7))[name = string("op_189_cast_fp16")]; fp16 var_190_to_fp16 = const()[name = string("op_190_to_fp16"), val = fp16(0x1p-3)]; tensor var_191_cast_fp16 = mul(x = var_189_cast_fp16, y = var_190_to_fp16)[name = string("op_191_cast_fp16")]; bool attn_weights_2_interleave_0 = const()[name = string("attn_weights_2_interleave_0"), val = bool(false)]; tensor attn_weights_2_cast_fp16 = concat(axis = var_47, interleave = attn_weights_2_interleave_0, values = (var_163_cast_fp16, var_167_cast_fp16, var_171_cast_fp16, var_175_cast_fp16, var_179_cast_fp16, var_183_cast_fp16, var_187_cast_fp16, var_191_cast_fp16))[name = string("attn_weights_2_cast_fp16")]; tensor attn_weights0_2_cast_fp16 = add(x = attn_weights_2_cast_fp16, y = var_33_cast_fp16)[name = string("attn_weights0_2_cast_fp16")]; tensor input_3_cast_fp16 = softmax(axis = var_46, x = attn_weights0_2_cast_fp16)[name = string("input_3_cast_fp16")]; tensor tile_3 = const()[name = string("tile_3"), val = tensor([1, 1, 1, 1, 1, 1, 1, 1])]; int32 var_197_axis_0 = const()[name = string("op_197_axis_0"), val = int32(2)]; tensor var_197_cast_fp16_0, tensor var_197_cast_fp16_1, tensor var_197_cast_fp16_2, tensor var_197_cast_fp16_3, tensor var_197_cast_fp16_4, tensor var_197_cast_fp16_5, tensor var_197_cast_fp16_6, tensor var_197_cast_fp16_7 = split(axis = var_197_axis_0, split_sizes = tile_3, x = input_3_cast_fp16)[name = string("op_197_cast_fp16")]; string var_207_equation_0 = const()[name = string("op_207_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_207_cast_fp16 = einsum(equation = var_207_equation_0, values = (var_151_cast_fp16_0, var_197_cast_fp16_0))[name = string("op_207_cast_fp16")]; string var_209_equation_0 = const()[name = string("op_209_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_209_cast_fp16 = einsum(equation = var_209_equation_0, values = (var_151_cast_fp16_1, var_197_cast_fp16_1))[name = string("op_209_cast_fp16")]; string var_211_equation_0 = const()[name = string("op_211_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_211_cast_fp16 = einsum(equation = var_211_equation_0, values = (var_151_cast_fp16_2, var_197_cast_fp16_2))[name = string("op_211_cast_fp16")]; string var_213_equation_0 = const()[name = string("op_213_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_213_cast_fp16 = einsum(equation = var_213_equation_0, values = (var_151_cast_fp16_3, var_197_cast_fp16_3))[name = string("op_213_cast_fp16")]; string var_215_equation_0 = const()[name = string("op_215_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_215_cast_fp16 = einsum(equation = var_215_equation_0, values = (var_151_cast_fp16_4, var_197_cast_fp16_4))[name = string("op_215_cast_fp16")]; string var_217_equation_0 = const()[name = string("op_217_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_217_cast_fp16 = einsum(equation = var_217_equation_0, values = (var_151_cast_fp16_5, var_197_cast_fp16_5))[name = string("op_217_cast_fp16")]; string var_219_equation_0 = const()[name = string("op_219_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_219_cast_fp16 = einsum(equation = var_219_equation_0, values = (var_151_cast_fp16_6, var_197_cast_fp16_6))[name = string("op_219_cast_fp16")]; string var_221_equation_0 = const()[name = string("op_221_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_221_cast_fp16 = einsum(equation = var_221_equation_0, values = (var_151_cast_fp16_7, var_197_cast_fp16_7))[name = string("op_221_cast_fp16")]; bool attn_6_interleave_0 = const()[name = string("attn_6_interleave_0"), val = bool(false)]; tensor attn_6_cast_fp16 = concat(axis = var_46, interleave = attn_6_interleave_0, values = (var_207_cast_fp16, var_209_cast_fp16, var_211_cast_fp16, var_213_cast_fp16, var_215_cast_fp16, var_217_cast_fp16, var_219_cast_fp16, var_221_cast_fp16))[name = string("attn_6_cast_fp16")]; tensor var_229 = const()[name = string("op_229"), val = tensor([1, 1])]; tensor var_231 = const()[name = string("op_231"), val = tensor([1, 1])]; string attn_8_pad_type_0 = const()[name = string("attn_8_pad_type_0"), val = string("custom")]; tensor attn_8_pad_0 = const()[name = string("attn_8_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_0_attn_out_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_0_attn_out_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(18955456))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(19218240))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(19217664)))]; tensor nlp_net_default_encoder_transformer_layers_0_attn_out_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_0_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(19219328)))]; tensor attn_8_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_0_attn_out_proj_bias_to_fp16, dilations = var_231, groups = var_46, pad = attn_8_pad_0, pad_type = attn_8_pad_type_0, strides = var_229, weight = nlp_net_default_encoder_transformer_layers_0_attn_out_proj_weight_to_fp16_affine_quantized, x = attn_6_cast_fp16)[name = string("attn_8_cast_fp16")]; tensor inputs_1_cast_fp16 = add(x = transpose_9, y = attn_8_cast_fp16)[name = string("inputs_1_cast_fp16")]; tensor input_5_axes_0 = const()[name = string("input_5_axes_0"), val = tensor([1])]; tensor input_5_gamma_0_to_fp16 = const()[name = string("input_5_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(19220416)))]; tensor input_5_beta_0_to_fp16 = const()[name = string("input_5_beta_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(19221504)))]; fp16 var_243_to_fp16 = const()[name = string("op_243_to_fp16"), val = fp16(0x1.5p-17)]; tensor input_5_cast_fp16 = layer_norm(axes = input_5_axes_0, beta = input_5_beta_0_to_fp16, epsilon = var_243_to_fp16, gamma = input_5_gamma_0_to_fp16, x = inputs_1_cast_fp16)[name = string("input_5_cast_fp16")]; tensor var_257 = const()[name = string("op_257"), val = tensor([1, 1])]; tensor var_259 = const()[name = string("op_259"), val = tensor([1, 1])]; string x_2_pad_type_0 = const()[name = string("x_2_pad_type_0"), val = string("custom")]; tensor x_2_pad_0 = const()[name = string("x_2_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_0_ffn_expand_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_0_ffn_expand_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(19222592))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(20273344))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(20271232)))]; tensor nlp_net_default_encoder_transformer_layers_0_ffn_expand_proj_bias_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_0_ffn_expand_proj_bias_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(20277504))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(20281728))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(20279616)))]; tensor x_2_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_0_ffn_expand_proj_bias_to_fp16_affine_quantized, dilations = var_259, groups = var_46, pad = x_2_pad_0, pad_type = x_2_pad_type_0, strides = var_257, weight = nlp_net_default_encoder_transformer_layers_0_ffn_expand_proj_weight_to_fp16_affine_quantized, x = input_5_cast_fp16)[name = string("x_2_cast_fp16")]; fp16 var_262_to_fp16 = const()[name = string("op_262_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_263_cast_fp16 = mul(x = x_2_cast_fp16, y = var_262_to_fp16)[name = string("op_263_cast_fp16")]; tensor var_264_cast_fp16 = sigmoid(x = var_263_cast_fp16)[name = string("op_264_cast_fp16")]; tensor input_7_cast_fp16 = mul(x = x_2_cast_fp16, y = var_264_cast_fp16)[name = string("input_7_cast_fp16")]; tensor var_268 = const()[name = string("op_268"), val = tensor([1, 1])]; tensor var_270 = const()[name = string("op_270"), val = tensor([1, 1])]; string input0_3_pad_type_0 = const()[name = string("input0_3_pad_type_0"), val = string("custom")]; tensor input0_3_pad_0 = const()[name = string("input0_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_0_ffn_contract_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_0_ffn_contract_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(20285888))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21335104))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21334528)))]; tensor nlp_net_default_encoder_transformer_layers_0_ffn_contract_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_0_ffn_contract_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21336192)))]; tensor input0_3_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_0_ffn_contract_proj_bias_to_fp16, dilations = var_270, groups = var_46, pad = input0_3_pad_0, pad_type = input0_3_pad_type_0, strides = var_268, weight = nlp_net_default_encoder_transformer_layers_0_ffn_contract_proj_weight_to_fp16_affine_quantized, x = input_7_cast_fp16)[name = string("input0_3_cast_fp16")]; tensor var_274_cast_fp16 = add(x = input0_3_cast_fp16, y = inputs_1_cast_fp16)[name = string("op_274_cast_fp16")]; fp16 var_275_to_fp16 = const()[name = string("op_275_to_fp16"), val = fp16(0x0p+0)]; tensor var_276_cast_fp16 = mul(x = transpose_9, y = var_275_to_fp16)[name = string("op_276_cast_fp16")]; tensor inputs_2_cast_fp16 = add(x = var_276_cast_fp16, y = var_274_cast_fp16)[name = string("inputs_2_cast_fp16")]; tensor k_7_axes_0 = const()[name = string("k_7_axes_0"), val = tensor([1])]; tensor k_7_gamma_0_to_fp16 = const()[name = string("k_7_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21337280)))]; tensor k_7_beta_0_to_fp16 = const()[name = string("k_7_beta_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21338368)))]; fp16 var_292_to_fp16 = const()[name = string("op_292_to_fp16"), val = fp16(0x1.5p-17)]; tensor k_7_cast_fp16 = layer_norm(axes = k_7_axes_0, beta = k_7_beta_0_to_fp16, epsilon = var_292_to_fp16, gamma = k_7_gamma_0_to_fp16, x = inputs_2_cast_fp16)[name = string("k_7_cast_fp16")]; tensor var_311 = const()[name = string("op_311"), val = tensor([1, 1])]; tensor var_313 = const()[name = string("op_313"), val = tensor([1, 1])]; string var_315_pad_type_0 = const()[name = string("op_315_pad_type_0"), val = string("custom")]; tensor var_315_pad_0 = const()[name = string("op_315_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_1_attn_q_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_1_attn_q_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21339456))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21602240))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21601664)))]; tensor nlp_net_default_encoder_transformer_layers_1_attn_q_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_1_attn_q_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21603328)))]; tensor var_315_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_1_attn_q_proj_bias_to_fp16, dilations = var_313, groups = var_46, pad = var_315_pad_0, pad_type = var_315_pad_type_0, strides = var_311, weight = nlp_net_default_encoder_transformer_layers_1_attn_q_proj_weight_to_fp16_affine_quantized, x = k_7_cast_fp16)[name = string("op_315_cast_fp16")]; tensor var_318 = const()[name = string("op_318"), val = tensor([1, 1])]; tensor var_320 = const()[name = string("op_320"), val = tensor([1, 1])]; string k_9_pad_type_0 = const()[name = string("k_9_pad_type_0"), val = string("custom")]; tensor k_9_pad_0 = const()[name = string("k_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_1_attn_k_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_1_attn_k_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21604416))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21867200))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21866624)))]; tensor nlp_net_default_encoder_transformer_layers_1_attn_k_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_1_attn_k_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21868288)))]; tensor k_9_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_1_attn_k_proj_bias_to_fp16, dilations = var_320, groups = var_46, pad = k_9_pad_0, pad_type = k_9_pad_type_0, strides = var_318, weight = nlp_net_default_encoder_transformer_layers_1_attn_k_proj_weight_to_fp16_affine_quantized, x = k_7_cast_fp16)[name = string("k_9_cast_fp16")]; tensor var_325 = const()[name = string("op_325"), val = tensor([1, 1])]; tensor var_327 = const()[name = string("op_327"), val = tensor([1, 1])]; string var_329_pad_type_0 = const()[name = string("op_329_pad_type_0"), val = string("custom")]; tensor var_329_pad_0 = const()[name = string("op_329_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_1_attn_v_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_1_attn_v_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(21869376))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22132160))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22131584)))]; tensor nlp_net_default_encoder_transformer_layers_1_attn_v_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_1_attn_v_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22133248)))]; tensor var_329_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_1_attn_v_proj_bias_to_fp16, dilations = var_327, groups = var_46, pad = var_329_pad_0, pad_type = var_329_pad_type_0, strides = var_325, weight = nlp_net_default_encoder_transformer_layers_1_attn_v_proj_weight_to_fp16_affine_quantized, x = k_7_cast_fp16)[name = string("op_329_cast_fp16")]; tensor tile_4 = const()[name = string("tile_4"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; int32 var_330_axis_0 = const()[name = string("op_330_axis_0"), val = int32(1)]; tensor var_330_cast_fp16_0, tensor var_330_cast_fp16_1, tensor var_330_cast_fp16_2, tensor var_330_cast_fp16_3, tensor var_330_cast_fp16_4, tensor var_330_cast_fp16_5, tensor var_330_cast_fp16_6, tensor var_330_cast_fp16_7 = split(axis = var_330_axis_0, split_sizes = tile_4, x = var_315_cast_fp16)[name = string("op_330_cast_fp16")]; tensor var_339_perm_0 = const()[name = string("op_339_perm_0"), val = tensor([0, 3, 2, 1])]; tensor tile_5 = const()[name = string("tile_5"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; int32 var_340_axis_0 = const()[name = string("op_340_axis_0"), val = int32(3)]; tensor transpose_7 = transpose(perm = var_339_perm_0, x = k_9_cast_fp16)[name = string("transpose_7")]; tensor var_340_cast_fp16_0, tensor var_340_cast_fp16_1, tensor var_340_cast_fp16_2, tensor var_340_cast_fp16_3, tensor var_340_cast_fp16_4, tensor var_340_cast_fp16_5, tensor var_340_cast_fp16_6, tensor var_340_cast_fp16_7 = split(axis = var_340_axis_0, split_sizes = tile_5, x = transpose_7)[name = string("op_340_cast_fp16")]; tensor tile_6 = const()[name = string("tile_6"), val = tensor([64, 64, 64, 64, 64, 64, 64, 64])]; int32 var_349_axis_0 = const()[name = string("op_349_axis_0"), val = int32(1)]; tensor var_349_cast_fp16_0, tensor var_349_cast_fp16_1, tensor var_349_cast_fp16_2, tensor var_349_cast_fp16_3, tensor var_349_cast_fp16_4, tensor var_349_cast_fp16_5, tensor var_349_cast_fp16_6, tensor var_349_cast_fp16_7 = split(axis = var_349_axis_0, split_sizes = tile_6, x = var_329_cast_fp16)[name = string("op_349_cast_fp16")]; string var_359_equation_0 = const()[name = string("op_359_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_359_cast_fp16 = einsum(equation = var_359_equation_0, values = (var_340_cast_fp16_0, var_330_cast_fp16_0))[name = string("op_359_cast_fp16")]; fp16 var_360_to_fp16 = const()[name = string("op_360_to_fp16"), val = fp16(0x1p-3)]; tensor var_361_cast_fp16 = mul(x = var_359_cast_fp16, y = var_360_to_fp16)[name = string("op_361_cast_fp16")]; string var_363_equation_0 = const()[name = string("op_363_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_363_cast_fp16 = einsum(equation = var_363_equation_0, values = (var_340_cast_fp16_1, var_330_cast_fp16_1))[name = string("op_363_cast_fp16")]; fp16 var_364_to_fp16 = const()[name = string("op_364_to_fp16"), val = fp16(0x1p-3)]; tensor var_365_cast_fp16 = mul(x = var_363_cast_fp16, y = var_364_to_fp16)[name = string("op_365_cast_fp16")]; string var_367_equation_0 = const()[name = string("op_367_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_367_cast_fp16 = einsum(equation = var_367_equation_0, values = (var_340_cast_fp16_2, var_330_cast_fp16_2))[name = string("op_367_cast_fp16")]; fp16 var_368_to_fp16 = const()[name = string("op_368_to_fp16"), val = fp16(0x1p-3)]; tensor var_369_cast_fp16 = mul(x = var_367_cast_fp16, y = var_368_to_fp16)[name = string("op_369_cast_fp16")]; string var_371_equation_0 = const()[name = string("op_371_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_371_cast_fp16 = einsum(equation = var_371_equation_0, values = (var_340_cast_fp16_3, var_330_cast_fp16_3))[name = string("op_371_cast_fp16")]; fp16 var_372_to_fp16 = const()[name = string("op_372_to_fp16"), val = fp16(0x1p-3)]; tensor var_373_cast_fp16 = mul(x = var_371_cast_fp16, y = var_372_to_fp16)[name = string("op_373_cast_fp16")]; string var_375_equation_0 = const()[name = string("op_375_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_375_cast_fp16 = einsum(equation = var_375_equation_0, values = (var_340_cast_fp16_4, var_330_cast_fp16_4))[name = string("op_375_cast_fp16")]; fp16 var_376_to_fp16 = const()[name = string("op_376_to_fp16"), val = fp16(0x1p-3)]; tensor var_377_cast_fp16 = mul(x = var_375_cast_fp16, y = var_376_to_fp16)[name = string("op_377_cast_fp16")]; string var_379_equation_0 = const()[name = string("op_379_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_379_cast_fp16 = einsum(equation = var_379_equation_0, values = (var_340_cast_fp16_5, var_330_cast_fp16_5))[name = string("op_379_cast_fp16")]; fp16 var_380_to_fp16 = const()[name = string("op_380_to_fp16"), val = fp16(0x1p-3)]; tensor var_381_cast_fp16 = mul(x = var_379_cast_fp16, y = var_380_to_fp16)[name = string("op_381_cast_fp16")]; string var_383_equation_0 = const()[name = string("op_383_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_383_cast_fp16 = einsum(equation = var_383_equation_0, values = (var_340_cast_fp16_6, var_330_cast_fp16_6))[name = string("op_383_cast_fp16")]; fp16 var_384_to_fp16 = const()[name = string("op_384_to_fp16"), val = fp16(0x1p-3)]; tensor var_385_cast_fp16 = mul(x = var_383_cast_fp16, y = var_384_to_fp16)[name = string("op_385_cast_fp16")]; string var_387_equation_0 = const()[name = string("op_387_equation_0"), val = string("bkhc,bchq->bkhq")]; tensor var_387_cast_fp16 = einsum(equation = var_387_equation_0, values = (var_340_cast_fp16_7, var_330_cast_fp16_7))[name = string("op_387_cast_fp16")]; fp16 var_388_to_fp16 = const()[name = string("op_388_to_fp16"), val = fp16(0x1p-3)]; tensor var_389_cast_fp16 = mul(x = var_387_cast_fp16, y = var_388_to_fp16)[name = string("op_389_cast_fp16")]; bool attn_weights_4_interleave_0 = const()[name = string("attn_weights_4_interleave_0"), val = bool(false)]; tensor attn_weights_4_cast_fp16 = concat(axis = var_47, interleave = attn_weights_4_interleave_0, values = (var_361_cast_fp16, var_365_cast_fp16, var_369_cast_fp16, var_373_cast_fp16, var_377_cast_fp16, var_381_cast_fp16, var_385_cast_fp16, var_389_cast_fp16))[name = string("attn_weights_4_cast_fp16")]; tensor attn_weights0_4_cast_fp16 = add(x = attn_weights_4_cast_fp16, y = var_33_cast_fp16)[name = string("attn_weights0_4_cast_fp16")]; tensor input_9_cast_fp16 = softmax(axis = var_46, x = attn_weights0_4_cast_fp16)[name = string("input_9_cast_fp16")]; tensor tile_7 = const()[name = string("tile_7"), val = tensor([1, 1, 1, 1, 1, 1, 1, 1])]; int32 var_395_axis_0 = const()[name = string("op_395_axis_0"), val = int32(2)]; tensor var_395_cast_fp16_0, tensor var_395_cast_fp16_1, tensor var_395_cast_fp16_2, tensor var_395_cast_fp16_3, tensor var_395_cast_fp16_4, tensor var_395_cast_fp16_5, tensor var_395_cast_fp16_6, tensor var_395_cast_fp16_7 = split(axis = var_395_axis_0, split_sizes = tile_7, x = input_9_cast_fp16)[name = string("op_395_cast_fp16")]; string var_405_equation_0 = const()[name = string("op_405_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_405_cast_fp16 = einsum(equation = var_405_equation_0, values = (var_349_cast_fp16_0, var_395_cast_fp16_0))[name = string("op_405_cast_fp16")]; string var_407_equation_0 = const()[name = string("op_407_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_407_cast_fp16 = einsum(equation = var_407_equation_0, values = (var_349_cast_fp16_1, var_395_cast_fp16_1))[name = string("op_407_cast_fp16")]; string var_409_equation_0 = const()[name = string("op_409_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_409_cast_fp16 = einsum(equation = var_409_equation_0, values = (var_349_cast_fp16_2, var_395_cast_fp16_2))[name = string("op_409_cast_fp16")]; string var_411_equation_0 = const()[name = string("op_411_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_411_cast_fp16 = einsum(equation = var_411_equation_0, values = (var_349_cast_fp16_3, var_395_cast_fp16_3))[name = string("op_411_cast_fp16")]; string var_413_equation_0 = const()[name = string("op_413_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_413_cast_fp16 = einsum(equation = var_413_equation_0, values = (var_349_cast_fp16_4, var_395_cast_fp16_4))[name = string("op_413_cast_fp16")]; string var_415_equation_0 = const()[name = string("op_415_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_415_cast_fp16 = einsum(equation = var_415_equation_0, values = (var_349_cast_fp16_5, var_395_cast_fp16_5))[name = string("op_415_cast_fp16")]; string var_417_equation_0 = const()[name = string("op_417_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_417_cast_fp16 = einsum(equation = var_417_equation_0, values = (var_349_cast_fp16_6, var_395_cast_fp16_6))[name = string("op_417_cast_fp16")]; string var_419_equation_0 = const()[name = string("op_419_equation_0"), val = string("bchk,bkhq->bchq")]; tensor var_419_cast_fp16 = einsum(equation = var_419_equation_0, values = (var_349_cast_fp16_7, var_395_cast_fp16_7))[name = string("op_419_cast_fp16")]; bool attn_12_interleave_0 = const()[name = string("attn_12_interleave_0"), val = bool(false)]; tensor attn_12_cast_fp16 = concat(axis = var_46, interleave = attn_12_interleave_0, values = (var_405_cast_fp16, var_407_cast_fp16, var_409_cast_fp16, var_411_cast_fp16, var_413_cast_fp16, var_415_cast_fp16, var_417_cast_fp16, var_419_cast_fp16))[name = string("attn_12_cast_fp16")]; tensor var_427 = const()[name = string("op_427"), val = tensor([1, 1])]; tensor var_429 = const()[name = string("op_429"), val = tensor([1, 1])]; string attn_14_pad_type_0 = const()[name = string("attn_14_pad_type_0"), val = string("custom")]; tensor attn_14_pad_0 = const()[name = string("attn_14_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_1_attn_out_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_1_attn_out_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22134336))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22397120))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22396544)))]; tensor nlp_net_default_encoder_transformer_layers_1_attn_out_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_1_attn_out_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22398208)))]; tensor attn_14_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_1_attn_out_proj_bias_to_fp16, dilations = var_429, groups = var_46, pad = attn_14_pad_0, pad_type = attn_14_pad_type_0, strides = var_427, weight = nlp_net_default_encoder_transformer_layers_1_attn_out_proj_weight_to_fp16_affine_quantized, x = attn_12_cast_fp16)[name = string("attn_14_cast_fp16")]; tensor inputs0_4_cast_fp16 = add(x = inputs_2_cast_fp16, y = attn_14_cast_fp16)[name = string("inputs0_4_cast_fp16")]; tensor input_11_axes_0 = const()[name = string("input_11_axes_0"), val = tensor([1])]; tensor input_11_gamma_0_to_fp16 = const()[name = string("input_11_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22399296)))]; tensor input_11_beta_0_to_fp16 = const()[name = string("input_11_beta_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22400384)))]; fp16 var_441_to_fp16 = const()[name = string("op_441_to_fp16"), val = fp16(0x1.5p-17)]; tensor input_11_cast_fp16 = layer_norm(axes = input_11_axes_0, beta = input_11_beta_0_to_fp16, epsilon = var_441_to_fp16, gamma = input_11_gamma_0_to_fp16, x = inputs0_4_cast_fp16)[name = string("input_11_cast_fp16")]; tensor var_455 = const()[name = string("op_455"), val = tensor([1, 1])]; tensor var_457 = const()[name = string("op_457"), val = tensor([1, 1])]; string x_4_pad_type_0 = const()[name = string("x_4_pad_type_0"), val = string("custom")]; tensor x_4_pad_0 = const()[name = string("x_4_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_1_ffn_expand_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_1_ffn_expand_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(22401472))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(23452224))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(23450112)))]; tensor nlp_net_default_encoder_transformer_layers_1_ffn_expand_proj_bias_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_1_ffn_expand_proj_bias_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(23456384))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(23460608))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(23458496)))]; tensor x_4_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_1_ffn_expand_proj_bias_to_fp16_affine_quantized, dilations = var_457, groups = var_46, pad = x_4_pad_0, pad_type = x_4_pad_type_0, strides = var_455, weight = nlp_net_default_encoder_transformer_layers_1_ffn_expand_proj_weight_to_fp16_affine_quantized, x = input_11_cast_fp16)[name = string("x_4_cast_fp16")]; fp16 var_460_to_fp16 = const()[name = string("op_460_to_fp16"), val = fp16(0x1.b3cp+0)]; tensor var_461_cast_fp16 = mul(x = x_4_cast_fp16, y = var_460_to_fp16)[name = string("op_461_cast_fp16")]; tensor var_462_cast_fp16 = sigmoid(x = var_461_cast_fp16)[name = string("op_462_cast_fp16")]; tensor input_13_cast_fp16 = mul(x = x_4_cast_fp16, y = var_462_cast_fp16)[name = string("input_13_cast_fp16")]; tensor var_466 = const()[name = string("op_466"), val = tensor([1, 1])]; tensor var_468 = const()[name = string("op_468"), val = tensor([1, 1])]; string input0_7_pad_type_0 = const()[name = string("input0_7_pad_type_0"), val = string("custom")]; tensor input0_7_pad_0 = const()[name = string("input0_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor nlp_net_default_encoder_transformer_layers_1_ffn_contract_proj_weight_to_fp16_affine_quantized = constexpr_affine_dequantize()[axis = int32(0), name = string("nlp_net_default_encoder_transformer_layers_1_ffn_contract_proj_weight_to_fp16_affine_quantized"), quantized_data = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(23464768))), scale = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(24513984))), zero_point = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(24513408)))]; tensor nlp_net_default_encoder_transformer_layers_1_ffn_contract_proj_bias_to_fp16 = const()[name = string("nlp_net_default_encoder_transformer_layers_1_ffn_contract_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(24515072)))]; tensor input0_7_cast_fp16 = conv(bias = nlp_net_default_encoder_transformer_layers_1_ffn_contract_proj_bias_to_fp16, dilations = var_468, groups = var_46, pad = input0_7_pad_0, pad_type = input0_7_pad_type_0, strides = var_466, weight = nlp_net_default_encoder_transformer_layers_1_ffn_contract_proj_weight_to_fp16_affine_quantized, x = input_13_cast_fp16)[name = string("input0_7_cast_fp16")]; tensor var_472_cast_fp16 = add(x = input0_7_cast_fp16, y = inputs0_4_cast_fp16)[name = string("op_472_cast_fp16")]; fp16 var_473_to_fp16 = const()[name = string("op_473_to_fp16"), val = fp16(0x0p+0)]; tensor var_474_cast_fp16 = mul(x = inputs_2_cast_fp16, y = var_473_to_fp16)[name = string("op_474_cast_fp16")]; tensor inputs0_2_cast_fp16 = add(x = var_474_cast_fp16, y = var_472_cast_fp16)[name = string("inputs0_2_cast_fp16")]; tensor k_11_axes_0 = const()[name = string("k_11_axes_0"), val = tensor([1])]; tensor k_11_gamma_0_to_fp16 = const()[name = string("k_11_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(24516160)))]; tensor k_11_beta_0_to_fp16 = const()[name = string("k_11_beta_0_to_fp16"), val = tensor(BLOBFILE(path = string("@model_path/weights/weight.bin"), offset = uint64(24517248)))]; fp16 var_490_to_fp16 = const()[name = string("op_490_to_fp16"), val = fp16(0x1.5p-17)]; tensor k_11_cast_fp16 = layer_norm(axes = k_11_axes_0, beta = k_11_beta_0_to_fp16, epsilon = var_490_to_fp16, gamma = k_11_gamma_0_to_fp16, x = inputs0_2_cast_fp16)[name = string("k_11_cast_fp16")]; tensor var_509 = const()[name = string("op_509"), val = tensor