program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3520.4.1"}, {"coremlc-version", "3520.5.1"}, {"coremltools-component-torch", "2.11.0"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "8.3.0"}})] { func main(tensor embedding, tensor features, tensor sigma, tensor x_noisy) { tensor var_25 = const()[name = tensor("op_25"), val = tensor([-1, 1, 1])]; tensor sigma_to_fp16_dtype_0 = const()[name = tensor("sigma_to_fp16_dtype_0"), val = tensor("fp16")]; tensor sigma_to_fp16 = cast(dtype = sigma_to_fp16_dtype_0, x = sigma)[name = tensor("cast_27")]; tensor s_cast_fp16 = reshape(shape = var_25, x = sigma_to_fp16)[name = tensor("s_cast_fp16")]; tensor var_27_cast_fp16 = mul(x = s_cast_fp16, y = s_cast_fp16)[name = tensor("op_27_cast_fp16")]; tensor var_29_to_fp16 = const()[name = tensor("op_29_to_fp16"), val = tensor(0x1.47cp-5)]; tensor var_30_cast_fp16 = add(x = var_27_cast_fp16, y = var_29_to_fp16)[name = tensor("op_30_cast_fp16")]; tensor var_31_epsilon_0 = const()[name = tensor("op_31_epsilon_0"), val = tensor(0x1.a36e2ep-14)]; tensor var_31_cast_fp16 = inverse(epsilon = var_31_epsilon_0, x = var_30_cast_fp16)[name = tensor("op_31_cast_fp16")]; tensor var_32_to_fp16 = const()[name = tensor("op_32_to_fp16"), val = tensor(0x1.47cp-5)]; tensor c_skip_cast_fp16 = mul(x = var_31_cast_fp16, y = var_32_to_fp16)[name = tensor("c_skip_cast_fp16")]; tensor var_34_to_fp16 = const()[name = tensor("op_34_to_fp16"), val = tensor(0x1.998p-3)]; tensor var_35_cast_fp16 = mul(x = s_cast_fp16, y = var_34_to_fp16)[name = tensor("op_35_cast_fp16")]; tensor var_40_cast_fp16 = sqrt(x = var_30_cast_fp16)[name = tensor("op_40_cast_fp16")]; tensor c_out_cast_fp16 = real_div(x = var_35_cast_fp16, y = var_40_cast_fp16)[name = tensor("c_out_cast_fp16")]; tensor var_47_epsilon_0 = const()[name = tensor("op_47_epsilon_0"), val = tensor(0x1.a36e2ep-14)]; tensor var_47_cast_fp16 = inverse(epsilon = var_47_epsilon_0, x = var_40_cast_fp16)[name = tensor("op_47_cast_fp16")]; tensor var_50_epsilon_0 = const()[name = tensor("op_50_epsilon_0"), val = tensor(0x1p-149)]; tensor var_50_cast_fp16 = log(epsilon = var_50_epsilon_0, x = sigma_to_fp16)[name = tensor("op_50_cast_fp16")]; tensor var_51_to_fp16 = const()[name = tensor("op_51_to_fp16"), val = tensor(0x1p-2)]; tensor x_1_cast_fp16 = mul(x = var_50_cast_fp16, y = var_51_to_fp16)[name = tensor("x_1_cast_fp16")]; tensor x_noisy_to_fp16_dtype_0 = const()[name = tensor("x_noisy_to_fp16_dtype_0"), val = tensor("fp16")]; tensor x_noisy_to_fp16 = cast(dtype = x_noisy_to_fp16_dtype_0, x = x_noisy)[name = tensor("cast_26")]; tensor x_11_cast_fp16 = mul(x = var_47_cast_fp16, y = x_noisy_to_fp16)[name = tensor("x_11_cast_fp16")]; tensor var_55 = const()[name = tensor("op_55"), val = tensor(-1)]; tensor var_67 = const()[name = tensor("op_67"), val = tensor([1, 1])]; tensor x_5_cast_fp16 = reshape(shape = var_67, x = x_1_cast_fp16)[name = tensor("x_5_cast_fp16")]; tensor var_75_to_fp16 = const()[name = tensor("op_75_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor var_76_cast_fp16 = mul(x = x_5_cast_fp16, y = var_75_to_fp16)[name = tensor("op_76_cast_fp16")]; tensor var_77_promoted_to_fp16 = const()[name = tensor("op_77_promoted_to_fp16"), val = tensor(0x1p+1)]; tensor var_78_cast_fp16 = mul(x = var_76_cast_fp16, y = var_77_promoted_to_fp16)[name = tensor("op_78_cast_fp16")]; tensor var_79_to_fp16 = const()[name = tensor("op_79_to_fp16"), val = tensor(0x1.92p+1)]; tensor freqs_cast_fp16 = mul(x = var_78_cast_fp16, y = var_79_to_fp16)[name = tensor("freqs_cast_fp16")]; tensor var_81_cast_fp16 = sin(x = freqs_cast_fp16)[name = tensor("op_81_cast_fp16")]; tensor var_82_cast_fp16 = cos(x = freqs_cast_fp16)[name = tensor("op_82_cast_fp16")]; tensor input_1_interleave_0 = const()[name = tensor("input_1_interleave_0"), val = tensor(false)]; tensor input_1_cast_fp16 = concat(axis = var_55, interleave = input_1_interleave_0, values = (x_5_cast_fp16, var_81_cast_fp16, var_82_cast_fp16))[name = tensor("input_1_cast_fp16")]; tensor transformer_to_time_0_1_weight_to_fp16 = const()[name = tensor("transformer_to_time_0_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(384)))]; tensor transformer_to_time_0_1_bias_to_fp16 = const()[name = tensor("transformer_to_time_0_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(526784)))]; tensor linear_0_cast_fp16 = linear(bias = transformer_to_time_0_1_bias_to_fp16, weight = transformer_to_time_0_1_weight_to_fp16, x = input_1_cast_fp16)[name = tensor("linear_0_cast_fp16")]; tensor var_88_mode_0 = const()[name = tensor("op_88_mode_0"), val = tensor("EXACT")]; tensor var_88_cast_fp16 = gelu(mode = var_88_mode_0, x = linear_0_cast_fp16)[name = tensor("op_88_cast_fp16")]; tensor features_to_fp16_dtype_0 = const()[name = tensor("features_to_fp16_dtype_0"), val = tensor("fp16")]; tensor transformer_to_features_0_weight_to_fp16 = const()[name = tensor("transformer_to_features_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(528896)))]; tensor transformer_to_features_0_bias_to_fp16 = const()[name = tensor("transformer_to_features_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1053248)))]; tensor features_to_fp16 = cast(dtype = features_to_fp16_dtype_0, x = features)[name = tensor("cast_25")]; tensor linear_1_cast_fp16 = linear(bias = transformer_to_features_0_bias_to_fp16, weight = transformer_to_features_0_weight_to_fp16, x = features_to_fp16)[name = tensor("linear_1_cast_fp16")]; tensor var_94_mode_0 = const()[name = tensor("op_94_mode_0"), val = tensor("EXACT")]; tensor var_94_cast_fp16 = gelu(mode = var_94_mode_0, x = linear_1_cast_fp16)[name = tensor("op_94_cast_fp16")]; tensor x_7_axis_0 = const()[name = tensor("x_7_axis_0"), val = tensor(0)]; tensor x_7_cast_fp16 = stack(axis = x_7_axis_0, values = (var_88_cast_fp16, var_94_cast_fp16))[name = tensor("x_7_cast_fp16")]; tensor var_101 = const()[name = tensor("op_101"), val = tensor([1, 2, 0])]; tensor input_7_axes_0 = const()[name = tensor("input_7_axes_0"), val = tensor([2])]; tensor input_7_keep_dims_0 = const()[name = tensor("input_7_keep_dims_0"), val = tensor(false)]; tensor x_9_cast_fp16 = transpose(perm = var_101, x = x_7_cast_fp16)[name = tensor("transpose_41")]; tensor input_7_cast_fp16 = reduce_sum(axes = input_7_axes_0, keep_dims = input_7_keep_dims_0, x = x_9_cast_fp16)[name = tensor("input_7_cast_fp16")]; tensor transformer_to_mapping_0_weight_to_fp16 = const()[name = tensor("transformer_to_mapping_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1055360)))]; tensor transformer_to_mapping_0_bias_to_fp16 = const()[name = tensor("transformer_to_mapping_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3152576)))]; tensor linear_2_cast_fp16 = linear(bias = transformer_to_mapping_0_bias_to_fp16, weight = transformer_to_mapping_0_weight_to_fp16, x = input_7_cast_fp16)[name = tensor("linear_2_cast_fp16")]; tensor input_11_mode_0 = const()[name = tensor("input_11_mode_0"), val = tensor("EXACT")]; tensor input_11_cast_fp16 = gelu(mode = input_11_mode_0, x = linear_2_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor transformer_to_mapping_2_weight_to_fp16 = const()[name = tensor("transformer_to_mapping_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3154688)))]; tensor transformer_to_mapping_2_bias_to_fp16 = const()[name = tensor("transformer_to_mapping_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5251904)))]; tensor linear_3_cast_fp16 = linear(bias = transformer_to_mapping_2_bias_to_fp16, weight = transformer_to_mapping_2_weight_to_fp16, x = input_11_cast_fp16)[name = tensor("linear_3_cast_fp16")]; tensor mapping_1_mode_0 = const()[name = tensor("mapping_1_mode_0"), val = tensor("EXACT")]; tensor mapping_1_cast_fp16 = gelu(mode = mapping_1_mode_0, x = linear_3_cast_fp16)[name = tensor("mapping_1_cast_fp16")]; tensor var_127_reps_0 = const()[name = tensor("op_127_reps_0"), val = tensor([1, 512, 1])]; tensor var_127_cast_fp16 = tile(reps = var_127_reps_0, x = x_11_cast_fp16)[name = tensor("op_127_cast_fp16")]; tensor var_129 = const()[name = tensor("op_129"), val = tensor(-1)]; tensor x_13_interleave_0 = const()[name = tensor("x_13_interleave_0"), val = tensor(false)]; tensor embedding_to_fp16_dtype_0 = const()[name = tensor("embedding_to_fp16_dtype_0"), val = tensor("fp16")]; tensor embedding_to_fp16 = cast(dtype = embedding_to_fp16_dtype_0, x = embedding)[name = tensor("cast_24")]; tensor x_13_cast_fp16 = concat(axis = var_129, interleave = x_13_interleave_0, values = (var_127_cast_fp16, embedding_to_fp16))[name = tensor("x_13_cast_fp16")]; tensor var_132_axes_0 = const()[name = tensor("op_132_axes_0"), val = tensor([1])]; tensor var_132_cast_fp16 = expand_dims(axes = var_132_axes_0, x = mapping_1_cast_fp16)[name = tensor("op_132_cast_fp16")]; tensor mapping_reps_0 = const()[name = tensor("mapping_reps_0"), val = tensor([1, 512, 1])]; tensor mapping_cast_fp16 = tile(reps = mapping_reps_0, x = var_132_cast_fp16)[name = tensor("mapping_cast_fp16")]; tensor x_15_cast_fp16 = add(x = x_13_cast_fp16, y = mapping_cast_fp16)[name = tensor("x_15_cast_fp16")]; tensor var_153 = const()[name = tensor("op_153"), val = tensor(-1)]; tensor transformer_blocks_0_attention_norm_fc_weight_to_fp16 = const()[name = tensor("transformer_blocks_0_attention_norm_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5254016)))]; tensor transformer_blocks_0_attention_norm_fc_bias_to_fp16 = const()[name = tensor("transformer_blocks_0_attention_norm_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6302656)))]; tensor linear_4_cast_fp16 = linear(bias = transformer_blocks_0_attention_norm_fc_bias_to_fp16, weight = transformer_blocks_0_attention_norm_fc_weight_to_fp16, x = features_to_fp16)[name = tensor("linear_4_cast_fp16")]; tensor var_172 = const()[name = tensor("op_172"), val = tensor([1, 2048, 1])]; tensor h_3_cast_fp16 = reshape(shape = var_172, x = linear_4_cast_fp16)[name = tensor("h_3_cast_fp16")]; tensor var_174_split_sizes_0 = const()[name = tensor("op_174_split_sizes_0"), val = tensor([1024, 1024])]; tensor var_174_axis_0 = const()[name = tensor("op_174_axis_0"), val = tensor(1)]; tensor var_174_cast_fp16_0, tensor var_174_cast_fp16_1 = split(axis = var_174_axis_0, split_sizes = var_174_split_sizes_0, x = h_3_cast_fp16)[name = tensor("op_174_cast_fp16")]; tensor gamma_3_perm_0 = const()[name = tensor("gamma_3_perm_0"), val = tensor([0, -1, 1])]; tensor beta_3_perm_0 = const()[name = tensor("beta_3_perm_0"), val = tensor([0, -1, 1])]; tensor x_19_axes_0 = const()[name = tensor("x_19_axes_0"), val = tensor([-1])]; tensor var_146_to_fp16 = const()[name = tensor("op_146_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_19_cast_fp16 = layer_norm(axes = x_19_axes_0, epsilon = var_146_to_fp16, x = x_15_cast_fp16)[name = tensor("x_19_cast_fp16")]; tensor var_180_promoted_to_fp16 = const()[name = tensor("op_180_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor gamma_3_cast_fp16 = transpose(perm = gamma_3_perm_0, x = var_174_cast_fp16_0)[name = tensor("transpose_40")]; tensor var_181_cast_fp16 = add(x = gamma_3_cast_fp16, y = var_180_promoted_to_fp16)[name = tensor("op_181_cast_fp16")]; tensor var_182_cast_fp16 = mul(x = var_181_cast_fp16, y = x_19_cast_fp16)[name = tensor("op_182_cast_fp16")]; tensor beta_3_cast_fp16 = transpose(perm = beta_3_perm_0, x = var_174_cast_fp16_1)[name = tensor("transpose_39")]; tensor x_21_cast_fp16 = add(x = var_182_cast_fp16, y = beta_3_cast_fp16)[name = tensor("x_21_cast_fp16")]; tensor transformer_blocks_0_attention_norm_context_fc_weight_to_fp16 = const()[name = tensor("transformer_blocks_0_attention_norm_context_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6306816)))]; tensor transformer_blocks_0_attention_norm_context_fc_bias_to_fp16 = const()[name = tensor("transformer_blocks_0_attention_norm_context_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7355456)))]; tensor linear_5_cast_fp16 = linear(bias = transformer_blocks_0_attention_norm_context_fc_bias_to_fp16, weight = transformer_blocks_0_attention_norm_context_fc_weight_to_fp16, x = features_to_fp16)[name = tensor("linear_5_cast_fp16")]; tensor var_194 = const()[name = tensor("op_194"), val = tensor([1, 2048, 1])]; tensor h_7_cast_fp16 = reshape(shape = var_194, x = linear_5_cast_fp16)[name = tensor("h_7_cast_fp16")]; tensor var_196_split_sizes_0 = const()[name = tensor("op_196_split_sizes_0"), val = tensor([1024, 1024])]; tensor var_196_axis_0 = const()[name = tensor("op_196_axis_0"), val = tensor(1)]; tensor var_196_cast_fp16_0, tensor var_196_cast_fp16_1 = split(axis = var_196_axis_0, split_sizes = var_196_split_sizes_0, x = h_7_cast_fp16)[name = tensor("op_196_cast_fp16")]; tensor gamma_7_perm_0 = const()[name = tensor("gamma_7_perm_0"), val = tensor([0, -1, 1])]; tensor beta_7_perm_0 = const()[name = tensor("beta_7_perm_0"), val = tensor([0, -1, 1])]; tensor var_202_promoted_to_fp16 = const()[name = tensor("op_202_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor gamma_7_cast_fp16 = transpose(perm = gamma_7_perm_0, x = var_196_cast_fp16_0)[name = tensor("transpose_38")]; tensor var_203_cast_fp16 = add(x = gamma_7_cast_fp16, y = var_202_promoted_to_fp16)[name = tensor("op_203_cast_fp16")]; tensor var_204_cast_fp16 = mul(x = var_203_cast_fp16, y = x_19_cast_fp16)[name = tensor("op_204_cast_fp16")]; tensor beta_7_cast_fp16 = transpose(perm = beta_7_perm_0, x = var_196_cast_fp16_1)[name = tensor("transpose_37")]; tensor x_27_cast_fp16 = add(x = var_204_cast_fp16, y = beta_7_cast_fp16)[name = tensor("x_27_cast_fp16")]; tensor transformer_blocks_0_attention_to_q_weight_to_fp16 = const()[name = tensor("transformer_blocks_0_attention_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7359616)))]; tensor linear_6_bias_0_to_fp16 = const()[name = tensor("linear_6_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8408256)))]; tensor linear_6_cast_fp16 = linear(bias = linear_6_bias_0_to_fp16, weight = transformer_blocks_0_attention_to_q_weight_to_fp16, x = x_21_cast_fp16)[name = tensor("linear_6_cast_fp16")]; tensor transformer_blocks_0_attention_to_kv_weight_to_fp16 = const()[name = tensor("transformer_blocks_0_attention_to_kv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8409344)))]; tensor linear_7_bias_0_to_fp16 = const()[name = tensor("linear_7_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10506560)))]; tensor linear_7_cast_fp16 = linear(bias = linear_7_bias_0_to_fp16, weight = transformer_blocks_0_attention_to_kv_weight_to_fp16, x = x_27_cast_fp16)[name = tensor("linear_7_cast_fp16")]; tensor var_212_split_sizes_0 = const()[name = tensor("op_212_split_sizes_0"), val = tensor([512, 512])]; tensor var_212_axis_0 = const()[name = tensor("op_212_axis_0"), val = tensor(-1)]; tensor var_212_cast_fp16_0, tensor var_212_cast_fp16_1 = split(axis = var_212_axis_0, split_sizes = var_212_split_sizes_0, x = linear_7_cast_fp16)[name = tensor("op_212_cast_fp16")]; tensor var_221 = const()[name = tensor("op_221"), val = tensor([1, 512, 8, 64])]; tensor x_31_cast_fp16 = reshape(shape = var_221, x = linear_6_cast_fp16)[name = tensor("x_31_cast_fp16")]; tensor var_231 = const()[name = tensor("op_231"), val = tensor([1, 512, 8, 64])]; tensor x_35_cast_fp16 = reshape(shape = var_231, x = var_212_cast_fp16_0)[name = tensor("x_35_cast_fp16")]; tensor var_241 = const()[name = tensor("op_241"), val = tensor([1, 512, 8, 64])]; tensor x_39_cast_fp16 = reshape(shape = var_241, x = var_212_cast_fp16_1)[name = tensor("x_39_cast_fp16")]; tensor var_243 = const()[name = tensor("op_243"), val = tensor([0, 2, 1, 3])]; tensor sim_1_transpose_x_0 = const()[name = tensor("sim_1_transpose_x_0"), val = tensor(false)]; tensor sim_1_transpose_y_0 = const()[name = tensor("sim_1_transpose_y_0"), val = tensor(false)]; tensor transpose_9_perm_0 = const()[name = tensor("transpose_9_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_10_perm_0 = const()[name = tensor("transpose_10_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_10 = transpose(perm = transpose_10_perm_0, x = x_35_cast_fp16)[name = tensor("transpose_34")]; tensor transpose_9 = transpose(perm = transpose_9_perm_0, x = x_31_cast_fp16)[name = tensor("transpose_35")]; tensor sim_1_cast_fp16 = matmul(transpose_x = sim_1_transpose_x_0, transpose_y = sim_1_transpose_y_0, x = transpose_9, y = transpose_10)[name = tensor("sim_1_cast_fp16")]; tensor var_247_to_fp16 = const()[name = tensor("op_247_to_fp16"), val = tensor(0x1p-3)]; tensor sim_3_cast_fp16 = mul(x = sim_1_cast_fp16, y = var_247_to_fp16)[name = tensor("sim_3_cast_fp16")]; tensor attn_1_cast_fp16 = softmax(axis = var_153, x = sim_3_cast_fp16)[name = tensor("attn_1_cast_fp16")]; tensor x_41_transpose_x_0 = const()[name = tensor("x_41_transpose_x_0"), val = tensor(false)]; tensor x_41_transpose_y_0 = const()[name = tensor("x_41_transpose_y_0"), val = tensor(false)]; tensor v_1_cast_fp16 = transpose(perm = var_243, x = x_39_cast_fp16)[name = tensor("transpose_36")]; tensor x_41_cast_fp16 = matmul(transpose_x = x_41_transpose_x_0, transpose_y = x_41_transpose_y_0, x = attn_1_cast_fp16, y = v_1_cast_fp16)[name = tensor("x_41_cast_fp16")]; tensor var_269 = const()[name = tensor("op_269"), val = tensor([0, 2, 1, 3])]; tensor var_271 = const()[name = tensor("op_271"), val = tensor([1, 512, 512])]; tensor x_43_cast_fp16 = transpose(perm = var_269, x = x_41_cast_fp16)[name = tensor("transpose_33")]; tensor input_23_cast_fp16 = reshape(shape = var_271, x = x_43_cast_fp16)[name = tensor("input_23_cast_fp16")]; tensor transformer_blocks_0_attention_attention_to_out_weight_to_fp16 = const()[name = tensor("transformer_blocks_0_attention_attention_to_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10508672)))]; tensor transformer_blocks_0_attention_attention_to_out_bias_to_fp16 = const()[name = tensor("transformer_blocks_0_attention_attention_to_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11557312)))]; tensor linear_8_cast_fp16 = linear(bias = transformer_blocks_0_attention_attention_to_out_bias_to_fp16, weight = transformer_blocks_0_attention_attention_to_out_weight_to_fp16, x = input_23_cast_fp16)[name = tensor("linear_8_cast_fp16")]; tensor input_25_cast_fp16 = add(x = linear_8_cast_fp16, y = x_15_cast_fp16)[name = tensor("input_25_cast_fp16")]; tensor transformer_blocks_0_feed_forward_0_weight_to_fp16 = const()[name = tensor("transformer_blocks_0_feed_forward_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11559424)))]; tensor transformer_blocks_0_feed_forward_0_bias_to_fp16 = const()[name = tensor("transformer_blocks_0_feed_forward_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15753792)))]; tensor linear_9_cast_fp16 = linear(bias = transformer_blocks_0_feed_forward_0_bias_to_fp16, weight = transformer_blocks_0_feed_forward_0_weight_to_fp16, x = input_25_cast_fp16)[name = tensor("linear_9_cast_fp16")]; tensor input_29_mode_0 = const()[name = tensor("input_29_mode_0"), val = tensor("EXACT")]; tensor input_29_cast_fp16 = gelu(mode = input_29_mode_0, x = linear_9_cast_fp16)[name = tensor("input_29_cast_fp16")]; tensor transformer_blocks_0_feed_forward_2_weight_to_fp16 = const()[name = tensor("transformer_blocks_0_feed_forward_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15757952)))]; tensor transformer_blocks_0_feed_forward_2_bias_to_fp16 = const()[name = tensor("transformer_blocks_0_feed_forward_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19952320)))]; tensor linear_10_cast_fp16 = linear(bias = transformer_blocks_0_feed_forward_2_bias_to_fp16, weight = transformer_blocks_0_feed_forward_2_weight_to_fp16, x = input_29_cast_fp16)[name = tensor("linear_10_cast_fp16")]; tensor x_45_cast_fp16 = add(x = linear_10_cast_fp16, y = input_25_cast_fp16)[name = tensor("x_45_cast_fp16")]; tensor x_47_cast_fp16 = add(x = x_45_cast_fp16, y = mapping_cast_fp16)[name = tensor("x_47_cast_fp16")]; tensor var_298 = const()[name = tensor("op_298"), val = tensor(-1)]; tensor transformer_blocks_1_attention_norm_fc_weight_to_fp16 = const()[name = tensor("transformer_blocks_1_attention_norm_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19954432)))]; tensor transformer_blocks_1_attention_norm_fc_bias_to_fp16 = const()[name = tensor("transformer_blocks_1_attention_norm_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21003072)))]; tensor linear_11_cast_fp16 = linear(bias = transformer_blocks_1_attention_norm_fc_bias_to_fp16, weight = transformer_blocks_1_attention_norm_fc_weight_to_fp16, x = features_to_fp16)[name = tensor("linear_11_cast_fp16")]; tensor var_317 = const()[name = tensor("op_317"), val = tensor([1, 2048, 1])]; tensor h_11_cast_fp16 = reshape(shape = var_317, x = linear_11_cast_fp16)[name = tensor("h_11_cast_fp16")]; tensor var_319_split_sizes_0 = const()[name = tensor("op_319_split_sizes_0"), val = tensor([1024, 1024])]; tensor var_319_axis_0 = const()[name = tensor("op_319_axis_0"), val = tensor(1)]; tensor var_319_cast_fp16_0, tensor var_319_cast_fp16_1 = split(axis = var_319_axis_0, split_sizes = var_319_split_sizes_0, x = h_11_cast_fp16)[name = tensor("op_319_cast_fp16")]; tensor gamma_11_perm_0 = const()[name = tensor("gamma_11_perm_0"), val = tensor([0, -1, 1])]; tensor beta_11_perm_0 = const()[name = tensor("beta_11_perm_0"), val = tensor([0, -1, 1])]; tensor x_51_axes_0 = const()[name = tensor("x_51_axes_0"), val = tensor([-1])]; tensor var_291_to_fp16 = const()[name = tensor("op_291_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_51_cast_fp16 = layer_norm(axes = x_51_axes_0, epsilon = var_291_to_fp16, x = x_47_cast_fp16)[name = tensor("x_51_cast_fp16")]; tensor var_325_promoted_to_fp16 = const()[name = tensor("op_325_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor gamma_11_cast_fp16 = transpose(perm = gamma_11_perm_0, x = var_319_cast_fp16_0)[name = tensor("transpose_32")]; tensor var_326_cast_fp16 = add(x = gamma_11_cast_fp16, y = var_325_promoted_to_fp16)[name = tensor("op_326_cast_fp16")]; tensor var_327_cast_fp16 = mul(x = var_326_cast_fp16, y = x_51_cast_fp16)[name = tensor("op_327_cast_fp16")]; tensor beta_11_cast_fp16 = transpose(perm = beta_11_perm_0, x = var_319_cast_fp16_1)[name = tensor("transpose_31")]; tensor x_53_cast_fp16 = add(x = var_327_cast_fp16, y = beta_11_cast_fp16)[name = tensor("x_53_cast_fp16")]; tensor transformer_blocks_1_attention_norm_context_fc_weight_to_fp16 = const()[name = tensor("transformer_blocks_1_attention_norm_context_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21007232)))]; tensor transformer_blocks_1_attention_norm_context_fc_bias_to_fp16 = const()[name = tensor("transformer_blocks_1_attention_norm_context_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22055872)))]; tensor linear_12_cast_fp16 = linear(bias = transformer_blocks_1_attention_norm_context_fc_bias_to_fp16, weight = transformer_blocks_1_attention_norm_context_fc_weight_to_fp16, x = features_to_fp16)[name = tensor("linear_12_cast_fp16")]; tensor var_339 = const()[name = tensor("op_339"), val = tensor([1, 2048, 1])]; tensor h_15_cast_fp16 = reshape(shape = var_339, x = linear_12_cast_fp16)[name = tensor("h_15_cast_fp16")]; tensor var_341_split_sizes_0 = const()[name = tensor("op_341_split_sizes_0"), val = tensor([1024, 1024])]; tensor var_341_axis_0 = const()[name = tensor("op_341_axis_0"), val = tensor(1)]; tensor var_341_cast_fp16_0, tensor var_341_cast_fp16_1 = split(axis = var_341_axis_0, split_sizes = var_341_split_sizes_0, x = h_15_cast_fp16)[name = tensor("op_341_cast_fp16")]; tensor gamma_15_perm_0 = const()[name = tensor("gamma_15_perm_0"), val = tensor([0, -1, 1])]; tensor beta_15_perm_0 = const()[name = tensor("beta_15_perm_0"), val = tensor([0, -1, 1])]; tensor var_347_promoted_to_fp16 = const()[name = tensor("op_347_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor gamma_15_cast_fp16 = transpose(perm = gamma_15_perm_0, x = var_341_cast_fp16_0)[name = tensor("transpose_30")]; tensor var_348_cast_fp16 = add(x = gamma_15_cast_fp16, y = var_347_promoted_to_fp16)[name = tensor("op_348_cast_fp16")]; tensor var_349_cast_fp16 = mul(x = var_348_cast_fp16, y = x_51_cast_fp16)[name = tensor("op_349_cast_fp16")]; tensor beta_15_cast_fp16 = transpose(perm = beta_15_perm_0, x = var_341_cast_fp16_1)[name = tensor("transpose_29")]; tensor x_59_cast_fp16 = add(x = var_349_cast_fp16, y = beta_15_cast_fp16)[name = tensor("x_59_cast_fp16")]; tensor transformer_blocks_1_attention_to_q_weight_to_fp16 = const()[name = tensor("transformer_blocks_1_attention_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22060032)))]; tensor linear_13_cast_fp16 = linear(bias = linear_6_bias_0_to_fp16, weight = transformer_blocks_1_attention_to_q_weight_to_fp16, x = x_53_cast_fp16)[name = tensor("linear_13_cast_fp16")]; tensor transformer_blocks_1_attention_to_kv_weight_to_fp16 = const()[name = tensor("transformer_blocks_1_attention_to_kv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23108672)))]; tensor linear_14_cast_fp16 = linear(bias = linear_7_bias_0_to_fp16, weight = transformer_blocks_1_attention_to_kv_weight_to_fp16, x = x_59_cast_fp16)[name = tensor("linear_14_cast_fp16")]; tensor var_357_split_sizes_0 = const()[name = tensor("op_357_split_sizes_0"), val = tensor([512, 512])]; tensor var_357_axis_0 = const()[name = tensor("op_357_axis_0"), val = tensor(-1)]; tensor var_357_cast_fp16_0, tensor var_357_cast_fp16_1 = split(axis = var_357_axis_0, split_sizes = var_357_split_sizes_0, x = linear_14_cast_fp16)[name = tensor("op_357_cast_fp16")]; tensor var_366 = const()[name = tensor("op_366"), val = tensor([1, 512, 8, 64])]; tensor x_63_cast_fp16 = reshape(shape = var_366, x = linear_13_cast_fp16)[name = tensor("x_63_cast_fp16")]; tensor var_376 = const()[name = tensor("op_376"), val = tensor([1, 512, 8, 64])]; tensor x_67_cast_fp16 = reshape(shape = var_376, x = var_357_cast_fp16_0)[name = tensor("x_67_cast_fp16")]; tensor var_386 = const()[name = tensor("op_386"), val = tensor([1, 512, 8, 64])]; tensor x_71_cast_fp16 = reshape(shape = var_386, x = var_357_cast_fp16_1)[name = tensor("x_71_cast_fp16")]; tensor var_388 = const()[name = tensor("op_388"), val = tensor([0, 2, 1, 3])]; tensor sim_5_transpose_x_0 = const()[name = tensor("sim_5_transpose_x_0"), val = tensor(false)]; tensor sim_5_transpose_y_0 = const()[name = tensor("sim_5_transpose_y_0"), val = tensor(false)]; tensor transpose_11_perm_0 = const()[name = tensor("transpose_11_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_12_perm_0 = const()[name = tensor("transpose_12_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_12 = transpose(perm = transpose_12_perm_0, x = x_67_cast_fp16)[name = tensor("transpose_26")]; tensor transpose_11 = transpose(perm = transpose_11_perm_0, x = x_63_cast_fp16)[name = tensor("transpose_27")]; tensor sim_5_cast_fp16 = matmul(transpose_x = sim_5_transpose_x_0, transpose_y = sim_5_transpose_y_0, x = transpose_11, y = transpose_12)[name = tensor("sim_5_cast_fp16")]; tensor var_392_to_fp16 = const()[name = tensor("op_392_to_fp16"), val = tensor(0x1p-3)]; tensor sim_7_cast_fp16 = mul(x = sim_5_cast_fp16, y = var_392_to_fp16)[name = tensor("sim_7_cast_fp16")]; tensor attn_3_cast_fp16 = softmax(axis = var_298, x = sim_7_cast_fp16)[name = tensor("attn_3_cast_fp16")]; tensor x_73_transpose_x_0 = const()[name = tensor("x_73_transpose_x_0"), val = tensor(false)]; tensor x_73_transpose_y_0 = const()[name = tensor("x_73_transpose_y_0"), val = tensor(false)]; tensor v_3_cast_fp16 = transpose(perm = var_388, x = x_71_cast_fp16)[name = tensor("transpose_28")]; tensor x_73_cast_fp16 = matmul(transpose_x = x_73_transpose_x_0, transpose_y = x_73_transpose_y_0, x = attn_3_cast_fp16, y = v_3_cast_fp16)[name = tensor("x_73_cast_fp16")]; tensor var_414 = const()[name = tensor("op_414"), val = tensor([0, 2, 1, 3])]; tensor var_416 = const()[name = tensor("op_416"), val = tensor([1, 512, 512])]; tensor x_75_cast_fp16 = transpose(perm = var_414, x = x_73_cast_fp16)[name = tensor("transpose_25")]; tensor input_39_cast_fp16 = reshape(shape = var_416, x = x_75_cast_fp16)[name = tensor("input_39_cast_fp16")]; tensor transformer_blocks_1_attention_attention_to_out_weight_to_fp16 = const()[name = tensor("transformer_blocks_1_attention_attention_to_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25205888)))]; tensor transformer_blocks_1_attention_attention_to_out_bias_to_fp16 = const()[name = tensor("transformer_blocks_1_attention_attention_to_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26254528)))]; tensor linear_15_cast_fp16 = linear(bias = transformer_blocks_1_attention_attention_to_out_bias_to_fp16, weight = transformer_blocks_1_attention_attention_to_out_weight_to_fp16, x = input_39_cast_fp16)[name = tensor("linear_15_cast_fp16")]; tensor input_41_cast_fp16 = add(x = linear_15_cast_fp16, y = x_47_cast_fp16)[name = tensor("input_41_cast_fp16")]; tensor transformer_blocks_1_feed_forward_0_weight_to_fp16 = const()[name = tensor("transformer_blocks_1_feed_forward_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26256640)))]; tensor transformer_blocks_1_feed_forward_0_bias_to_fp16 = const()[name = tensor("transformer_blocks_1_feed_forward_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30451008)))]; tensor linear_16_cast_fp16 = linear(bias = transformer_blocks_1_feed_forward_0_bias_to_fp16, weight = transformer_blocks_1_feed_forward_0_weight_to_fp16, x = input_41_cast_fp16)[name = tensor("linear_16_cast_fp16")]; tensor input_45_mode_0 = const()[name = tensor("input_45_mode_0"), val = tensor("EXACT")]; tensor input_45_cast_fp16 = gelu(mode = input_45_mode_0, x = linear_16_cast_fp16)[name = tensor("input_45_cast_fp16")]; tensor transformer_blocks_1_feed_forward_2_weight_to_fp16 = const()[name = tensor("transformer_blocks_1_feed_forward_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30455168)))]; tensor transformer_blocks_1_feed_forward_2_bias_to_fp16 = const()[name = tensor("transformer_blocks_1_feed_forward_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34649536)))]; tensor linear_17_cast_fp16 = linear(bias = transformer_blocks_1_feed_forward_2_bias_to_fp16, weight = transformer_blocks_1_feed_forward_2_weight_to_fp16, x = input_45_cast_fp16)[name = tensor("linear_17_cast_fp16")]; tensor x_77_cast_fp16 = add(x = linear_17_cast_fp16, y = input_41_cast_fp16)[name = tensor("x_77_cast_fp16")]; tensor x_79_cast_fp16 = add(x = x_77_cast_fp16, y = mapping_cast_fp16)[name = tensor("x_79_cast_fp16")]; tensor var_443 = const()[name = tensor("op_443"), val = tensor(-1)]; tensor transformer_blocks_2_attention_norm_fc_weight_to_fp16 = const()[name = tensor("transformer_blocks_2_attention_norm_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34651648)))]; tensor transformer_blocks_2_attention_norm_fc_bias_to_fp16 = const()[name = tensor("transformer_blocks_2_attention_norm_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35700288)))]; tensor linear_18_cast_fp16 = linear(bias = transformer_blocks_2_attention_norm_fc_bias_to_fp16, weight = transformer_blocks_2_attention_norm_fc_weight_to_fp16, x = features_to_fp16)[name = tensor("linear_18_cast_fp16")]; tensor var_462 = const()[name = tensor("op_462"), val = tensor([1, 2048, 1])]; tensor h_19_cast_fp16 = reshape(shape = var_462, x = linear_18_cast_fp16)[name = tensor("h_19_cast_fp16")]; tensor var_464_split_sizes_0 = const()[name = tensor("op_464_split_sizes_0"), val = tensor([1024, 1024])]; tensor var_464_axis_0 = const()[name = tensor("op_464_axis_0"), val = tensor(1)]; tensor var_464_cast_fp16_0, tensor var_464_cast_fp16_1 = split(axis = var_464_axis_0, split_sizes = var_464_split_sizes_0, x = h_19_cast_fp16)[name = tensor("op_464_cast_fp16")]; tensor gamma_19_perm_0 = const()[name = tensor("gamma_19_perm_0"), val = tensor([0, -1, 1])]; tensor beta_19_perm_0 = const()[name = tensor("beta_19_perm_0"), val = tensor([0, -1, 1])]; tensor x_83_axes_0 = const()[name = tensor("x_83_axes_0"), val = tensor([-1])]; tensor var_436_to_fp16 = const()[name = tensor("op_436_to_fp16"), val = tensor(0x1.5p-17)]; tensor x_83_cast_fp16 = layer_norm(axes = x_83_axes_0, epsilon = var_436_to_fp16, x = x_79_cast_fp16)[name = tensor("x_83_cast_fp16")]; tensor var_470_promoted_to_fp16 = const()[name = tensor("op_470_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor gamma_19_cast_fp16 = transpose(perm = gamma_19_perm_0, x = var_464_cast_fp16_0)[name = tensor("transpose_24")]; tensor var_471_cast_fp16 = add(x = gamma_19_cast_fp16, y = var_470_promoted_to_fp16)[name = tensor("op_471_cast_fp16")]; tensor var_472_cast_fp16 = mul(x = var_471_cast_fp16, y = x_83_cast_fp16)[name = tensor("op_472_cast_fp16")]; tensor beta_19_cast_fp16 = transpose(perm = beta_19_perm_0, x = var_464_cast_fp16_1)[name = tensor("transpose_23")]; tensor x_85_cast_fp16 = add(x = var_472_cast_fp16, y = beta_19_cast_fp16)[name = tensor("x_85_cast_fp16")]; tensor transformer_blocks_2_attention_norm_context_fc_weight_to_fp16 = const()[name = tensor("transformer_blocks_2_attention_norm_context_fc_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35704448)))]; tensor transformer_blocks_2_attention_norm_context_fc_bias_to_fp16 = const()[name = tensor("transformer_blocks_2_attention_norm_context_fc_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36753088)))]; tensor linear_19_cast_fp16 = linear(bias = transformer_blocks_2_attention_norm_context_fc_bias_to_fp16, weight = transformer_blocks_2_attention_norm_context_fc_weight_to_fp16, x = features_to_fp16)[name = tensor("linear_19_cast_fp16")]; tensor var_484 = const()[name = tensor("op_484"), val = tensor([1, 2048, 1])]; tensor h_cast_fp16 = reshape(shape = var_484, x = linear_19_cast_fp16)[name = tensor("h_cast_fp16")]; tensor var_486_split_sizes_0 = const()[name = tensor("op_486_split_sizes_0"), val = tensor([1024, 1024])]; tensor var_486_axis_0 = const()[name = tensor("op_486_axis_0"), val = tensor(1)]; tensor var_486_cast_fp16_0, tensor var_486_cast_fp16_1 = split(axis = var_486_axis_0, split_sizes = var_486_split_sizes_0, x = h_cast_fp16)[name = tensor("op_486_cast_fp16")]; tensor gamma_perm_0 = const()[name = tensor("gamma_perm_0"), val = tensor([0, -1, 1])]; tensor beta_perm_0 = const()[name = tensor("beta_perm_0"), val = tensor([0, -1, 1])]; tensor var_492_promoted_to_fp16 = const()[name = tensor("op_492_promoted_to_fp16"), val = tensor(0x1p+0)]; tensor gamma_cast_fp16 = transpose(perm = gamma_perm_0, x = var_486_cast_fp16_0)[name = tensor("transpose_22")]; tensor var_493_cast_fp16 = add(x = gamma_cast_fp16, y = var_492_promoted_to_fp16)[name = tensor("op_493_cast_fp16")]; tensor var_494_cast_fp16 = mul(x = var_493_cast_fp16, y = x_83_cast_fp16)[name = tensor("op_494_cast_fp16")]; tensor beta_cast_fp16 = transpose(perm = beta_perm_0, x = var_486_cast_fp16_1)[name = tensor("transpose_21")]; tensor x_91_cast_fp16 = add(x = var_494_cast_fp16, y = beta_cast_fp16)[name = tensor("x_91_cast_fp16")]; tensor transformer_blocks_2_attention_to_q_weight_to_fp16 = const()[name = tensor("transformer_blocks_2_attention_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36757248)))]; tensor linear_20_cast_fp16 = linear(bias = linear_6_bias_0_to_fp16, weight = transformer_blocks_2_attention_to_q_weight_to_fp16, x = x_85_cast_fp16)[name = tensor("linear_20_cast_fp16")]; tensor transformer_blocks_2_attention_to_kv_weight_to_fp16 = const()[name = tensor("transformer_blocks_2_attention_to_kv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37805888)))]; tensor linear_21_cast_fp16 = linear(bias = linear_7_bias_0_to_fp16, weight = transformer_blocks_2_attention_to_kv_weight_to_fp16, x = x_91_cast_fp16)[name = tensor("linear_21_cast_fp16")]; tensor var_502_split_sizes_0 = const()[name = tensor("op_502_split_sizes_0"), val = tensor([512, 512])]; tensor var_502_axis_0 = const()[name = tensor("op_502_axis_0"), val = tensor(-1)]; tensor var_502_cast_fp16_0, tensor var_502_cast_fp16_1 = split(axis = var_502_axis_0, split_sizes = var_502_split_sizes_0, x = linear_21_cast_fp16)[name = tensor("op_502_cast_fp16")]; tensor var_511 = const()[name = tensor("op_511"), val = tensor([1, 512, 8, 64])]; tensor x_95_cast_fp16 = reshape(shape = var_511, x = linear_20_cast_fp16)[name = tensor("x_95_cast_fp16")]; tensor var_521 = const()[name = tensor("op_521"), val = tensor([1, 512, 8, 64])]; tensor x_99_cast_fp16 = reshape(shape = var_521, x = var_502_cast_fp16_0)[name = tensor("x_99_cast_fp16")]; tensor var_531 = const()[name = tensor("op_531"), val = tensor([1, 512, 8, 64])]; tensor x_103_cast_fp16 = reshape(shape = var_531, x = var_502_cast_fp16_1)[name = tensor("x_103_cast_fp16")]; tensor var_533 = const()[name = tensor("op_533"), val = tensor([0, 2, 1, 3])]; tensor sim_9_transpose_x_0 = const()[name = tensor("sim_9_transpose_x_0"), val = tensor(false)]; tensor sim_9_transpose_y_0 = const()[name = tensor("sim_9_transpose_y_0"), val = tensor(false)]; tensor transpose_13_perm_0 = const()[name = tensor("transpose_13_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_14_perm_0 = const()[name = tensor("transpose_14_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_14 = transpose(perm = transpose_14_perm_0, x = x_99_cast_fp16)[name = tensor("transpose_18")]; tensor transpose_13 = transpose(perm = transpose_13_perm_0, x = x_95_cast_fp16)[name = tensor("transpose_19")]; tensor sim_9_cast_fp16 = matmul(transpose_x = sim_9_transpose_x_0, transpose_y = sim_9_transpose_y_0, x = transpose_13, y = transpose_14)[name = tensor("sim_9_cast_fp16")]; tensor var_537_to_fp16 = const()[name = tensor("op_537_to_fp16"), val = tensor(0x1p-3)]; tensor sim_cast_fp16 = mul(x = sim_9_cast_fp16, y = var_537_to_fp16)[name = tensor("sim_cast_fp16")]; tensor attn_cast_fp16 = softmax(axis = var_443, x = sim_cast_fp16)[name = tensor("attn_cast_fp16")]; tensor x_105_transpose_x_0 = const()[name = tensor("x_105_transpose_x_0"), val = tensor(false)]; tensor x_105_transpose_y_0 = const()[name = tensor("x_105_transpose_y_0"), val = tensor(false)]; tensor v_cast_fp16 = transpose(perm = var_533, x = x_103_cast_fp16)[name = tensor("transpose_20")]; tensor x_105_cast_fp16 = matmul(transpose_x = x_105_transpose_x_0, transpose_y = x_105_transpose_y_0, x = attn_cast_fp16, y = v_cast_fp16)[name = tensor("x_105_cast_fp16")]; tensor var_559 = const()[name = tensor("op_559"), val = tensor([0, 2, 1, 3])]; tensor var_561 = const()[name = tensor("op_561"), val = tensor([1, 512, 512])]; tensor x_107_cast_fp16 = transpose(perm = var_559, x = x_105_cast_fp16)[name = tensor("transpose_17")]; tensor input_55_cast_fp16 = reshape(shape = var_561, x = x_107_cast_fp16)[name = tensor("input_55_cast_fp16")]; tensor transformer_blocks_2_attention_attention_to_out_weight_to_fp16 = const()[name = tensor("transformer_blocks_2_attention_attention_to_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39903104)))]; tensor transformer_blocks_2_attention_attention_to_out_bias_to_fp16 = const()[name = tensor("transformer_blocks_2_attention_attention_to_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40951744)))]; tensor linear_22_cast_fp16 = linear(bias = transformer_blocks_2_attention_attention_to_out_bias_to_fp16, weight = transformer_blocks_2_attention_attention_to_out_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("linear_22_cast_fp16")]; tensor input_57_cast_fp16 = add(x = linear_22_cast_fp16, y = x_79_cast_fp16)[name = tensor("input_57_cast_fp16")]; tensor transformer_blocks_2_feed_forward_0_weight_to_fp16 = const()[name = tensor("transformer_blocks_2_feed_forward_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40953856)))]; tensor transformer_blocks_2_feed_forward_0_bias_to_fp16 = const()[name = tensor("transformer_blocks_2_feed_forward_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45148224)))]; tensor linear_23_cast_fp16 = linear(bias = transformer_blocks_2_feed_forward_0_bias_to_fp16, weight = transformer_blocks_2_feed_forward_0_weight_to_fp16, x = input_57_cast_fp16)[name = tensor("linear_23_cast_fp16")]; tensor input_61_mode_0 = const()[name = tensor("input_61_mode_0"), val = tensor("EXACT")]; tensor input_61_cast_fp16 = gelu(mode = input_61_mode_0, x = linear_23_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor transformer_blocks_2_feed_forward_2_weight_to_fp16 = const()[name = tensor("transformer_blocks_2_feed_forward_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45152384)))]; tensor transformer_blocks_2_feed_forward_2_bias_to_fp16 = const()[name = tensor("transformer_blocks_2_feed_forward_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49346752)))]; tensor linear_24_cast_fp16 = linear(bias = transformer_blocks_2_feed_forward_2_bias_to_fp16, weight = transformer_blocks_2_feed_forward_2_weight_to_fp16, x = input_61_cast_fp16)[name = tensor("linear_24_cast_fp16")]; tensor x_109_cast_fp16 = add(x = linear_24_cast_fp16, y = input_57_cast_fp16)[name = tensor("x_109_cast_fp16")]; tensor var_581_axes_0 = const()[name = tensor("op_581_axes_0"), val = tensor([1])]; tensor var_581_keep_dims_0 = const()[name = tensor("op_581_keep_dims_0"), val = tensor(false)]; tensor var_581_cast_fp16 = reduce_mean(axes = var_581_axes_0, keep_dims = var_581_keep_dims_0, x = x_109_cast_fp16)[name = tensor("op_581_cast_fp16")]; tensor x_111_axes_0 = const()[name = tensor("x_111_axes_0"), val = tensor([1])]; tensor x_111_cast_fp16 = expand_dims(axes = x_111_axes_0, x = var_581_cast_fp16)[name = tensor("x_111_cast_fp16")]; tensor var_590 = const()[name = tensor("op_590"), val = tensor([0, 2, 1])]; tensor x_pad_type_0 = const()[name = tensor("x_pad_type_0"), val = tensor("valid")]; tensor x_strides_0 = const()[name = tensor("x_strides_0"), val = tensor([1])]; tensor x_pad_0 = const()[name = tensor("x_pad_0"), val = tensor([0, 0])]; tensor x_dilations_0 = const()[name = tensor("x_dilations_0"), val = tensor([1])]; tensor x_groups_0 = const()[name = tensor("x_groups_0"), val = tensor(1)]; tensor transformer_to_out_1_weight_to_fp16 = const()[name = tensor("transformer_to_out_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49348864)))]; tensor transformer_to_out_1_bias_to_fp16 = const()[name = tensor("transformer_to_out_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(49873216)))]; tensor input_cast_fp16 = transpose(perm = var_590, x = x_111_cast_fp16)[name = tensor("transpose_16")]; tensor x_cast_fp16 = conv(bias = transformer_to_out_1_bias_to_fp16, dilations = x_dilations_0, groups = x_groups_0, pad = x_pad_0, pad_type = x_pad_type_0, strides = x_strides_0, weight = transformer_to_out_1_weight_to_fp16, x = input_cast_fp16)[name = tensor("x_cast_fp16")]; tensor x_pred_perm_0 = const()[name = tensor("x_pred_perm_0"), val = tensor([0, -1, -2])]; tensor var_602_cast_fp16 = mul(x = c_skip_cast_fp16, y = x_noisy_to_fp16)[name = tensor("op_602_cast_fp16")]; tensor x_pred_cast_fp16 = transpose(perm = x_pred_perm_0, x = x_cast_fp16)[name = tensor("transpose_15")]; tensor var_603_cast_fp16 = mul(x = c_out_cast_fp16, y = x_pred_cast_fp16)[name = tensor("op_603_cast_fp16")]; tensor denoised = add(x = var_602_cast_fp16, y = var_603_cast_fp16)[name = tensor("op_605_cast_fp16")]; } -> (denoised); }