diff --git "a/SD TURBO FULL SE CHUNK 384x384/Unet.mlmodelc/model.mil" "b/SD TURBO FULL SE CHUNK 384x384/Unet.mlmodelc/model.mil" new file mode 100644--- /dev/null +++ "b/SD TURBO FULL SE CHUNK 384x384/Unet.mlmodelc/model.mil" @@ -0,0 +1,11766 @@ +program(1.0) +[buildInfo = dict, tensor>({{"coremlc-component-MIL", "5.33.5"}, {"coremlc-version", "1877.40.3"}, {"coremltools-component-torch", "2.0.1"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "7.1"}})] +{ + func main(tensor encoder_hidden_states, tensor sample, tensor timestep) { + tensor var_25 = const()[name = tensor("op_25"), val = tensor(-1)]; + tensor var_42_axes_0 = const()[name = tensor("op_42_axes_0"), val = tensor([1])]; + tensor var_42_cast_fp16 = expand_dims(axes = var_42_axes_0, x = timestep)[name = tensor("op_42_cast_fp16")]; + tensor var_44_to_fp16 = const()[name = tensor("op_44_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; + tensor emb_3_cast_fp16 = mul(x = var_42_cast_fp16, y = var_44_to_fp16)[name = tensor("emb_3_cast_fp16")]; + tensor var_49_cast_fp16 = sin(x = emb_3_cast_fp16)[name = tensor("op_49_cast_fp16")]; + tensor var_50_cast_fp16 = cos(x = emb_3_cast_fp16)[name = tensor("op_50_cast_fp16")]; + tensor emb_interleave_0 = const()[name = tensor("emb_interleave_0"), val = tensor(false)]; + tensor emb_cast_fp16 = concat(axis = var_25, interleave = emb_interleave_0, values = (var_49_cast_fp16, var_50_cast_fp16))[name = tensor("emb_cast_fp16")]; + tensor var_54_begin_0 = const()[name = tensor("op_54_begin_0"), val = tensor([0, 160])]; + tensor var_54_end_0 = const()[name = tensor("op_54_end_0"), val = tensor([2, 320])]; + tensor var_54_end_mask_0 = const()[name = tensor("op_54_end_mask_0"), val = tensor([true, true])]; + tensor var_54_cast_fp16 = slice_by_index(begin = var_54_begin_0, end = var_54_end_0, end_mask = var_54_end_mask_0, x = emb_cast_fp16)[name = tensor("op_54_cast_fp16")]; + tensor var_56_begin_0 = const()[name = tensor("op_56_begin_0"), val = tensor([0, 0])]; + tensor var_56_end_0 = const()[name = tensor("op_56_end_0"), val = tensor([2, 160])]; + tensor var_56_end_mask_0 = const()[name = tensor("op_56_end_mask_0"), val = tensor([true, false])]; + tensor var_56_cast_fp16 = slice_by_index(begin = var_56_begin_0, end = var_56_end_0, end_mask = var_56_end_mask_0, x = emb_cast_fp16)[name = tensor("op_56_cast_fp16")]; + tensor sample_interleave_0 = const()[name = tensor("sample_interleave_0"), val = tensor(false)]; + tensor sample_cast_fp16 = concat(axis = var_25, interleave = sample_interleave_0, values = (var_54_cast_fp16, var_56_cast_fp16))[name = tensor("sample_cast_fp16")]; + tensor var_59 = const()[name = tensor("op_59"), val = tensor(1)]; + tensor var_66_axes_0 = const()[name = tensor("op_66_axes_0"), val = tensor([-1])]; + tensor var_66_cast_fp16 = expand_dims(axes = var_66_axes_0, x = sample_cast_fp16)[name = tensor("op_66_cast_fp16")]; + tensor input_1_axes_0 = const()[name = tensor("input_1_axes_0"), val = tensor([-1])]; + tensor input_1_cast_fp16 = expand_dims(axes = input_1_axes_0, x = var_66_cast_fp16)[name = tensor("input_1_cast_fp16")]; + tensor var_70 = const()[name = tensor("op_70"), val = tensor([1, 1])]; + tensor var_72 = const()[name = tensor("op_72"), val = tensor([1, 1])]; + tensor input_3_pad_type_0 = const()[name = tensor("input_3_pad_type_0"), val = tensor("custom")]; + tensor input_3_pad_0 = const()[name = tensor("input_3_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor time_embedding_linear_1_weight_to_fp16 = const()[name = tensor("time_embedding_linear_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448)))]; + tensor time_embedding_linear_1_bias_to_fp16 = const()[name = tensor("time_embedding_linear_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(819712)))]; + tensor input_3_cast_fp16 = conv(bias = time_embedding_linear_1_bias_to_fp16, dilations = var_72, groups = var_59, pad = input_3_pad_0, pad_type = input_3_pad_type_0, strides = var_70, weight = time_embedding_linear_1_weight_to_fp16, x = input_1_cast_fp16)[name = tensor("input_3_cast_fp16")]; + tensor input_5_cast_fp16 = silu(x = input_3_cast_fp16)[name = tensor("input_5_cast_fp16")]; + tensor var_78 = const()[name = tensor("op_78"), val = tensor([1, 1])]; + tensor var_80 = const()[name = tensor("op_80"), val = tensor([1, 1])]; + tensor input_13_pad_type_0 = const()[name = tensor("input_13_pad_type_0"), val = tensor("custom")]; + tensor input_13_pad_0 = const()[name = tensor("input_13_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor time_embedding_linear_2_weight_to_fp16 = const()[name = tensor("time_embedding_linear_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(822336)))]; + tensor time_embedding_linear_2_bias_to_fp16 = const()[name = tensor("time_embedding_linear_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4099200)))]; + tensor input_13_cast_fp16 = conv(bias = time_embedding_linear_2_bias_to_fp16, dilations = var_80, groups = var_59, pad = input_13_pad_0, pad_type = input_13_pad_type_0, strides = var_78, weight = time_embedding_linear_2_weight_to_fp16, x = input_5_cast_fp16)[name = tensor("input_13_cast_fp16")]; + tensor var_86 = const()[name = tensor("op_86"), val = tensor(1)]; + tensor var_89 = const()[name = tensor("op_89"), val = tensor([1, 1])]; + tensor var_91 = const()[name = tensor("op_91"), val = tensor([1, 1])]; + tensor input_7_pad_type_0 = const()[name = tensor("input_7_pad_type_0"), val = tensor("custom")]; + tensor input_7_pad_0 = const()[name = tensor("input_7_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor conv_in_weight_to_fp16 = const()[name = tensor("conv_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4101824)))]; + tensor conv_in_bias_to_fp16 = const()[name = tensor("conv_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4124928)))]; + tensor input_7_cast_fp16 = conv(bias = conv_in_bias_to_fp16, dilations = var_91, groups = var_86, pad = input_7_pad_0, pad_type = input_7_pad_type_0, strides = var_89, weight = conv_in_weight_to_fp16, x = sample)[name = tensor("input_7_cast_fp16")]; + tensor var_107 = const()[name = tensor("op_107"), val = tensor(true)]; + tensor var_112 = const()[name = tensor("op_112"), val = tensor(1)]; + tensor reshape_0_shape_0 = const()[name = tensor("reshape_0_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_0_cast_fp16 = reshape(shape = reshape_0_shape_0, x = input_7_cast_fp16)[name = tensor("reshape_0_cast_fp16")]; + tensor reduce_mean_0_axes_0 = const()[name = tensor("reduce_mean_0_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_0_keep_dims_0 = const()[name = tensor("reduce_mean_0_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_0_cast_fp16 = reduce_mean(axes = reduce_mean_0_axes_0, keep_dims = reduce_mean_0_keep_dims_0, x = reshape_0_cast_fp16)[name = tensor("reduce_mean_0_cast_fp16")]; + tensor sub_0_cast_fp16 = sub(x = reshape_0_cast_fp16, y = reduce_mean_0_cast_fp16)[name = tensor("sub_0_cast_fp16")]; + tensor square_0_cast_fp16 = square(x = sub_0_cast_fp16)[name = tensor("square_0_cast_fp16")]; + tensor reduce_mean_2_axes_0 = const()[name = tensor("reduce_mean_2_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_2_keep_dims_0 = const()[name = tensor("reduce_mean_2_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_2_cast_fp16 = reduce_mean(axes = reduce_mean_2_axes_0, keep_dims = reduce_mean_2_keep_dims_0, x = square_0_cast_fp16)[name = tensor("reduce_mean_2_cast_fp16")]; + tensor add_0_y_0_to_fp16 = const()[name = tensor("add_0_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_0_cast_fp16 = add(x = reduce_mean_2_cast_fp16, y = add_0_y_0_to_fp16)[name = tensor("add_0_cast_fp16")]; + tensor sqrt_0_cast_fp16 = sqrt(x = add_0_cast_fp16)[name = tensor("sqrt_0_cast_fp16")]; + tensor real_div_0_cast_fp16 = real_div(x = sub_0_cast_fp16, y = sqrt_0_cast_fp16)[name = tensor("real_div_0_cast_fp16")]; + tensor reshape_1_shape_0 = const()[name = tensor("reshape_1_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_1_cast_fp16 = reshape(shape = reshape_1_shape_0, x = real_div_0_cast_fp16)[name = tensor("reshape_1_cast_fp16")]; + tensor add_1_mean_0_to_fp16 = const()[name = tensor("add_1_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4125632)))]; + tensor add_1_variance_0_to_fp16 = const()[name = tensor("add_1_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4126336)))]; + tensor add_1_gamma_0_to_fp16 = const()[name = tensor("add_1_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4127040)))]; + tensor add_1_beta_0_to_fp16 = const()[name = tensor("add_1_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4127744)))]; + tensor add_1_epsilon_0_to_fp16 = const()[name = tensor("add_1_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_1_cast_fp16 = batch_norm(beta = add_1_beta_0_to_fp16, epsilon = add_1_epsilon_0_to_fp16, gamma = add_1_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_1_cast_fp16)[name = tensor("add_1_cast_fp16")]; + tensor input_11_cast_fp16 = silu(x = add_1_cast_fp16)[name = tensor("input_11_cast_fp16")]; + tensor var_134 = const()[name = tensor("op_134"), val = tensor([1, 1])]; + tensor var_136 = const()[name = tensor("op_136"), val = tensor([1, 1])]; + tensor hidden_states_1_pad_type_0 = const()[name = tensor("hidden_states_1_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_1_pad_0 = const()[name = tensor("hidden_states_1_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_0_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4128448)))]; + tensor down_blocks_0_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5971712)))]; + tensor hidden_states_1_cast_fp16 = conv(bias = down_blocks_0_resnets_0_conv1_bias_to_fp16, dilations = var_136, groups = var_112, pad = hidden_states_1_pad_0, pad_type = hidden_states_1_pad_type_0, strides = var_134, weight = down_blocks_0_resnets_0_conv1_weight_to_fp16, x = input_11_cast_fp16)[name = tensor("hidden_states_1_cast_fp16")]; + tensor input_15_cast_fp16 = silu(x = input_13_cast_fp16)[name = tensor("input_15_cast_fp16")]; + tensor var_142 = const()[name = tensor("op_142"), val = tensor([1, 1])]; + tensor var_144 = const()[name = tensor("op_144"), val = tensor([1, 1])]; + tensor temb_1_pad_type_0 = const()[name = tensor("temb_1_pad_type_0"), val = tensor("custom")]; + tensor temb_1_pad_0 = const()[name = tensor("temb_1_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5972416)))]; + tensor down_blocks_0_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6791680)))]; + tensor temb_1_cast_fp16 = conv(bias = down_blocks_0_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_144, groups = var_112, pad = temb_1_pad_0, pad_type = temb_1_pad_type_0, strides = var_142, weight = down_blocks_0_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_1_cast_fp16")]; + tensor input_17_cast_fp16 = add(x = hidden_states_1_cast_fp16, y = temb_1_cast_fp16)[name = tensor("input_17_cast_fp16")]; + tensor reshape_4_shape_0 = const()[name = tensor("reshape_4_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_4_cast_fp16 = reshape(shape = reshape_4_shape_0, x = input_17_cast_fp16)[name = tensor("reshape_4_cast_fp16")]; + tensor reduce_mean_3_axes_0 = const()[name = tensor("reduce_mean_3_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_3_keep_dims_0 = const()[name = tensor("reduce_mean_3_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_3_cast_fp16 = reduce_mean(axes = reduce_mean_3_axes_0, keep_dims = reduce_mean_3_keep_dims_0, x = reshape_4_cast_fp16)[name = tensor("reduce_mean_3_cast_fp16")]; + tensor sub_2_cast_fp16 = sub(x = reshape_4_cast_fp16, y = reduce_mean_3_cast_fp16)[name = tensor("sub_2_cast_fp16")]; + tensor square_1_cast_fp16 = square(x = sub_2_cast_fp16)[name = tensor("square_1_cast_fp16")]; + tensor reduce_mean_5_axes_0 = const()[name = tensor("reduce_mean_5_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_5_keep_dims_0 = const()[name = tensor("reduce_mean_5_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_5_cast_fp16 = reduce_mean(axes = reduce_mean_5_axes_0, keep_dims = reduce_mean_5_keep_dims_0, x = square_1_cast_fp16)[name = tensor("reduce_mean_5_cast_fp16")]; + tensor add_2_y_0_to_fp16 = const()[name = tensor("add_2_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_2_cast_fp16 = add(x = reduce_mean_5_cast_fp16, y = add_2_y_0_to_fp16)[name = tensor("add_2_cast_fp16")]; + tensor sqrt_1_cast_fp16 = sqrt(x = add_2_cast_fp16)[name = tensor("sqrt_1_cast_fp16")]; + tensor real_div_1_cast_fp16 = real_div(x = sub_2_cast_fp16, y = sqrt_1_cast_fp16)[name = tensor("real_div_1_cast_fp16")]; + tensor reshape_5_shape_0 = const()[name = tensor("reshape_5_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_5_cast_fp16 = reshape(shape = reshape_5_shape_0, x = real_div_1_cast_fp16)[name = tensor("reshape_5_cast_fp16")]; + tensor add_3_gamma_0_to_fp16 = const()[name = tensor("add_3_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6792384)))]; + tensor add_3_beta_0_to_fp16 = const()[name = tensor("add_3_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6793088)))]; + tensor add_3_epsilon_0_to_fp16 = const()[name = tensor("add_3_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_3_cast_fp16 = batch_norm(beta = add_3_beta_0_to_fp16, epsilon = add_3_epsilon_0_to_fp16, gamma = add_3_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_5_cast_fp16)[name = tensor("add_3_cast_fp16")]; + tensor input_21_cast_fp16 = silu(x = add_3_cast_fp16)[name = tensor("input_21_cast_fp16")]; + tensor var_154 = const()[name = tensor("op_154"), val = tensor([1, 1])]; + tensor var_156 = const()[name = tensor("op_156"), val = tensor([1, 1])]; + tensor hidden_states_3_pad_type_0 = const()[name = tensor("hidden_states_3_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_3_pad_0 = const()[name = tensor("hidden_states_3_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_0_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6793792)))]; + tensor down_blocks_0_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8637056)))]; + tensor hidden_states_3_cast_fp16 = conv(bias = down_blocks_0_resnets_0_conv2_bias_to_fp16, dilations = var_156, groups = var_112, pad = hidden_states_3_pad_0, pad_type = hidden_states_3_pad_type_0, strides = var_154, weight = down_blocks_0_resnets_0_conv2_weight_to_fp16, x = input_21_cast_fp16)[name = tensor("hidden_states_3_cast_fp16")]; + tensor hidden_states_5_cast_fp16 = add(x = input_7_cast_fp16, y = hidden_states_3_cast_fp16)[name = tensor("hidden_states_5_cast_fp16")]; + tensor reshape_8_shape_0 = const()[name = tensor("reshape_8_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_8_cast_fp16 = reshape(shape = reshape_8_shape_0, x = hidden_states_5_cast_fp16)[name = tensor("reshape_8_cast_fp16")]; + tensor reduce_mean_6_axes_0 = const()[name = tensor("reduce_mean_6_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_6_keep_dims_0 = const()[name = tensor("reduce_mean_6_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_6_cast_fp16 = reduce_mean(axes = reduce_mean_6_axes_0, keep_dims = reduce_mean_6_keep_dims_0, x = reshape_8_cast_fp16)[name = tensor("reduce_mean_6_cast_fp16")]; + tensor sub_4_cast_fp16 = sub(x = reshape_8_cast_fp16, y = reduce_mean_6_cast_fp16)[name = tensor("sub_4_cast_fp16")]; + tensor square_2_cast_fp16 = square(x = sub_4_cast_fp16)[name = tensor("square_2_cast_fp16")]; + tensor reduce_mean_8_axes_0 = const()[name = tensor("reduce_mean_8_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_8_keep_dims_0 = const()[name = tensor("reduce_mean_8_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_8_cast_fp16 = reduce_mean(axes = reduce_mean_8_axes_0, keep_dims = reduce_mean_8_keep_dims_0, x = square_2_cast_fp16)[name = tensor("reduce_mean_8_cast_fp16")]; + tensor add_4_y_0_to_fp16 = const()[name = tensor("add_4_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_4_cast_fp16 = add(x = reduce_mean_8_cast_fp16, y = add_4_y_0_to_fp16)[name = tensor("add_4_cast_fp16")]; + tensor sqrt_2_cast_fp16 = sqrt(x = add_4_cast_fp16)[name = tensor("sqrt_2_cast_fp16")]; + tensor real_div_2_cast_fp16 = real_div(x = sub_4_cast_fp16, y = sqrt_2_cast_fp16)[name = tensor("real_div_2_cast_fp16")]; + tensor reshape_9_shape_0 = const()[name = tensor("reshape_9_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_9_cast_fp16 = reshape(shape = reshape_9_shape_0, x = real_div_2_cast_fp16)[name = tensor("reshape_9_cast_fp16")]; + tensor add_5_gamma_0_to_fp16 = const()[name = tensor("add_5_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8637760)))]; + tensor add_5_beta_0_to_fp16 = const()[name = tensor("add_5_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8638464)))]; + tensor add_5_epsilon_0_to_fp16 = const()[name = tensor("add_5_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_5_cast_fp16 = batch_norm(beta = add_5_beta_0_to_fp16, epsilon = add_5_epsilon_0_to_fp16, gamma = add_5_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_9_cast_fp16)[name = tensor("add_5_cast_fp16")]; + tensor var_176 = const()[name = tensor("op_176"), val = tensor([1, 1])]; + tensor var_178 = const()[name = tensor("op_178"), val = tensor([1, 1])]; + tensor hidden_states_7_pad_type_0 = const()[name = tensor("hidden_states_7_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_7_pad_0 = const()[name = tensor("hidden_states_7_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8639168)))]; + tensor down_blocks_0_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8844032)))]; + tensor hidden_states_7_cast_fp16 = conv(bias = down_blocks_0_attentions_0_proj_in_bias_to_fp16, dilations = var_178, groups = var_112, pad = hidden_states_7_pad_0, pad_type = hidden_states_7_pad_type_0, strides = var_176, weight = down_blocks_0_attentions_0_proj_in_weight_to_fp16, x = add_5_cast_fp16)[name = tensor("hidden_states_7_cast_fp16")]; + tensor var_183 = const()[name = tensor("op_183"), val = tensor([2, 320, 1, 2304])]; + tensor inputs_1_cast_fp16 = reshape(shape = var_183, x = hidden_states_7_cast_fp16)[name = tensor("inputs_1_cast_fp16")]; + tensor var_193 = const()[name = tensor("op_193"), val = tensor([1])]; + tensor channels_mean_1_cast_fp16 = reduce_mean(axes = var_193, keep_dims = var_107, x = inputs_1_cast_fp16)[name = tensor("channels_mean_1_cast_fp16")]; + tensor zero_mean_1_cast_fp16 = sub(x = inputs_1_cast_fp16, y = channels_mean_1_cast_fp16)[name = tensor("zero_mean_1_cast_fp16")]; + tensor zero_mean_sq_1_cast_fp16 = mul(x = zero_mean_1_cast_fp16, y = zero_mean_1_cast_fp16)[name = tensor("zero_mean_sq_1_cast_fp16")]; + tensor var_197 = const()[name = tensor("op_197"), val = tensor([1])]; + tensor var_198_cast_fp16 = reduce_mean(axes = var_197, keep_dims = var_107, x = zero_mean_sq_1_cast_fp16)[name = tensor("op_198_cast_fp16")]; + tensor var_199_to_fp16 = const()[name = tensor("op_199_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_200_cast_fp16 = add(x = var_198_cast_fp16, y = var_199_to_fp16)[name = tensor("op_200_cast_fp16")]; + tensor denom_1_epsilon_0_to_fp16 = const()[name = tensor("denom_1_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_1_cast_fp16 = rsqrt(epsilon = denom_1_epsilon_0_to_fp16, x = var_200_cast_fp16)[name = tensor("denom_1_cast_fp16")]; + tensor out_1_cast_fp16 = mul(x = zero_mean_1_cast_fp16, y = denom_1_cast_fp16)[name = tensor("out_1_cast_fp16")]; + tensor var_204_to_fp16 = const()[name = tensor("op_204_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8844736)))]; + tensor var_205_cast_fp16 = add(x = out_1_cast_fp16, y = var_204_to_fp16)[name = tensor("op_205_cast_fp16")]; + tensor var_207_to_fp16 = const()[name = tensor("op_207_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8845440)))]; + tensor hidden_states_9_cast_fp16 = mul(x = var_205_cast_fp16, y = var_207_to_fp16)[name = tensor("hidden_states_9_cast_fp16")]; + tensor var_214 = const()[name = tensor("op_214"), val = tensor([1, 1])]; + tensor var_216 = const()[name = tensor("op_216"), val = tensor([1, 1])]; + tensor q_1_pad_type_0 = const()[name = tensor("q_1_pad_type_0"), val = tensor("custom")]; + tensor q_1_pad_0 = const()[name = tensor("q_1_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8846144)))]; + tensor q_1_cast_fp16 = conv(dilations = var_216, groups = var_112, pad = q_1_pad_0, pad_type = q_1_pad_type_0, strides = var_214, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_9_cast_fp16)[name = tensor("q_1_cast_fp16")]; + tensor var_220 = const()[name = tensor("op_220"), val = tensor([1, 1])]; + tensor var_222 = const()[name = tensor("op_222"), val = tensor([1, 1])]; + tensor k_1_pad_type_0 = const()[name = tensor("k_1_pad_type_0"), val = tensor("custom")]; + tensor k_1_pad_0 = const()[name = tensor("k_1_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9051008)))]; + tensor k_1_cast_fp16 = conv(dilations = var_222, groups = var_112, pad = k_1_pad_0, pad_type = k_1_pad_type_0, strides = var_220, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_9_cast_fp16)[name = tensor("k_1_cast_fp16")]; + tensor var_226 = const()[name = tensor("op_226"), val = tensor([1, 1])]; + tensor var_228 = const()[name = tensor("op_228"), val = tensor([1, 1])]; + tensor v_1_pad_type_0 = const()[name = tensor("v_1_pad_type_0"), val = tensor("custom")]; + tensor v_1_pad_0 = const()[name = tensor("v_1_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9255872)))]; + tensor v_1_cast_fp16 = conv(dilations = var_228, groups = var_112, pad = v_1_pad_0, pad_type = v_1_pad_type_0, strides = var_226, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_9_cast_fp16)[name = tensor("v_1_cast_fp16")]; + tensor var_232_begin_0 = const()[name = tensor("op_232_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_232_end_0 = const()[name = tensor("op_232_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_232_end_mask_0 = const()[name = tensor("op_232_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_232_cast_fp16 = slice_by_index(begin = var_232_begin_0, end = var_232_end_0, end_mask = var_232_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_232_cast_fp16")]; + tensor var_236_begin_0 = const()[name = tensor("op_236_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_236_end_0 = const()[name = tensor("op_236_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_236_end_mask_0 = const()[name = tensor("op_236_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_236_cast_fp16 = slice_by_index(begin = var_236_begin_0, end = var_236_end_0, end_mask = var_236_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_236_cast_fp16")]; + tensor var_240_begin_0 = const()[name = tensor("op_240_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_240_end_0 = const()[name = tensor("op_240_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_240_end_mask_0 = const()[name = tensor("op_240_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_240_cast_fp16 = slice_by_index(begin = var_240_begin_0, end = var_240_end_0, end_mask = var_240_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_240_cast_fp16")]; + tensor var_244_begin_0 = const()[name = tensor("op_244_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_244_end_0 = const()[name = tensor("op_244_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_244_end_mask_0 = const()[name = tensor("op_244_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_244_cast_fp16 = slice_by_index(begin = var_244_begin_0, end = var_244_end_0, end_mask = var_244_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_244_cast_fp16")]; + tensor var_248_begin_0 = const()[name = tensor("op_248_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_248_end_0 = const()[name = tensor("op_248_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_248_end_mask_0 = const()[name = tensor("op_248_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_248_cast_fp16 = slice_by_index(begin = var_248_begin_0, end = var_248_end_0, end_mask = var_248_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_248_cast_fp16")]; + tensor k_3_perm_0 = const()[name = tensor("k_3_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_255_begin_0 = const()[name = tensor("op_255_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_255_end_0 = const()[name = tensor("op_255_end_0"), val = tensor([2, 2304, 1, 64])]; + tensor var_255_end_mask_0 = const()[name = tensor("op_255_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_31 = transpose(perm = k_3_perm_0, x = k_1_cast_fp16)[name = tensor("transpose_31")]; + tensor var_255_cast_fp16 = slice_by_index(begin = var_255_begin_0, end = var_255_end_0, end_mask = var_255_end_mask_0, x = transpose_31)[name = tensor("op_255_cast_fp16")]; + tensor var_259_begin_0 = const()[name = tensor("op_259_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_259_end_0 = const()[name = tensor("op_259_end_0"), val = tensor([2, 2304, 1, 128])]; + tensor var_259_end_mask_0 = const()[name = tensor("op_259_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_259_cast_fp16 = slice_by_index(begin = var_259_begin_0, end = var_259_end_0, end_mask = var_259_end_mask_0, x = transpose_31)[name = tensor("op_259_cast_fp16")]; + tensor var_263_begin_0 = const()[name = tensor("op_263_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_263_end_0 = const()[name = tensor("op_263_end_0"), val = tensor([2, 2304, 1, 192])]; + tensor var_263_end_mask_0 = const()[name = tensor("op_263_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_263_cast_fp16 = slice_by_index(begin = var_263_begin_0, end = var_263_end_0, end_mask = var_263_end_mask_0, x = transpose_31)[name = tensor("op_263_cast_fp16")]; + tensor var_267_begin_0 = const()[name = tensor("op_267_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_267_end_0 = const()[name = tensor("op_267_end_0"), val = tensor([2, 2304, 1, 256])]; + tensor var_267_end_mask_0 = const()[name = tensor("op_267_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_267_cast_fp16 = slice_by_index(begin = var_267_begin_0, end = var_267_end_0, end_mask = var_267_end_mask_0, x = transpose_31)[name = tensor("op_267_cast_fp16")]; + tensor var_271_begin_0 = const()[name = tensor("op_271_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_271_end_0 = const()[name = tensor("op_271_end_0"), val = tensor([2, 2304, 1, 320])]; + tensor var_271_end_mask_0 = const()[name = tensor("op_271_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_271_cast_fp16 = slice_by_index(begin = var_271_begin_0, end = var_271_end_0, end_mask = var_271_end_mask_0, x = transpose_31)[name = tensor("op_271_cast_fp16")]; + tensor var_273_begin_0 = const()[name = tensor("op_273_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_273_end_0 = const()[name = tensor("op_273_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_273_end_mask_0 = const()[name = tensor("op_273_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_273_cast_fp16 = slice_by_index(begin = var_273_begin_0, end = var_273_end_0, end_mask = var_273_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_273_cast_fp16")]; + tensor var_277_begin_0 = const()[name = tensor("op_277_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_277_end_0 = const()[name = tensor("op_277_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_277_end_mask_0 = const()[name = tensor("op_277_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_277_cast_fp16 = slice_by_index(begin = var_277_begin_0, end = var_277_end_0, end_mask = var_277_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_277_cast_fp16")]; + tensor var_281_begin_0 = const()[name = tensor("op_281_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_281_end_0 = const()[name = tensor("op_281_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_281_end_mask_0 = const()[name = tensor("op_281_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_281_cast_fp16 = slice_by_index(begin = var_281_begin_0, end = var_281_end_0, end_mask = var_281_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_281_cast_fp16")]; + tensor var_285_begin_0 = const()[name = tensor("op_285_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_285_end_0 = const()[name = tensor("op_285_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_285_end_mask_0 = const()[name = tensor("op_285_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_285_cast_fp16 = slice_by_index(begin = var_285_begin_0, end = var_285_end_0, end_mask = var_285_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_285_cast_fp16")]; + tensor var_289_begin_0 = const()[name = tensor("op_289_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_289_end_0 = const()[name = tensor("op_289_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_289_end_mask_0 = const()[name = tensor("op_289_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_289_cast_fp16 = slice_by_index(begin = var_289_begin_0, end = var_289_end_0, end_mask = var_289_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_289_cast_fp16")]; + tensor var_293_equation_0 = const()[name = tensor("op_293_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_293_cast_fp16 = einsum(equation = var_293_equation_0, values = (var_255_cast_fp16, var_232_cast_fp16))[name = tensor("op_293_cast_fp16")]; + tensor var_294_to_fp16 = const()[name = tensor("op_294_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_1_cast_fp16 = mul(x = var_293_cast_fp16, y = var_294_to_fp16)[name = tensor("aw_1_cast_fp16")]; + tensor var_297_equation_0 = const()[name = tensor("op_297_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_297_cast_fp16 = einsum(equation = var_297_equation_0, values = (var_259_cast_fp16, var_236_cast_fp16))[name = tensor("op_297_cast_fp16")]; + tensor var_298_to_fp16 = const()[name = tensor("op_298_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_3_cast_fp16 = mul(x = var_297_cast_fp16, y = var_298_to_fp16)[name = tensor("aw_3_cast_fp16")]; + tensor var_301_equation_0 = const()[name = tensor("op_301_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_301_cast_fp16 = einsum(equation = var_301_equation_0, values = (var_263_cast_fp16, var_240_cast_fp16))[name = tensor("op_301_cast_fp16")]; + tensor var_302_to_fp16 = const()[name = tensor("op_302_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_5_cast_fp16 = mul(x = var_301_cast_fp16, y = var_302_to_fp16)[name = tensor("aw_5_cast_fp16")]; + tensor var_305_equation_0 = const()[name = tensor("op_305_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_305_cast_fp16 = einsum(equation = var_305_equation_0, values = (var_267_cast_fp16, var_244_cast_fp16))[name = tensor("op_305_cast_fp16")]; + tensor var_306_to_fp16 = const()[name = tensor("op_306_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_7_cast_fp16 = mul(x = var_305_cast_fp16, y = var_306_to_fp16)[name = tensor("aw_7_cast_fp16")]; + tensor var_309_equation_0 = const()[name = tensor("op_309_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_309_cast_fp16 = einsum(equation = var_309_equation_0, values = (var_271_cast_fp16, var_248_cast_fp16))[name = tensor("op_309_cast_fp16")]; + tensor var_310_to_fp16 = const()[name = tensor("op_310_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_9_cast_fp16 = mul(x = var_309_cast_fp16, y = var_310_to_fp16)[name = tensor("aw_9_cast_fp16")]; + tensor var_312_cast_fp16 = softmax(axis = var_112, x = aw_1_cast_fp16)[name = tensor("op_312_cast_fp16")]; + tensor var_313_cast_fp16 = softmax(axis = var_112, x = aw_3_cast_fp16)[name = tensor("op_313_cast_fp16")]; + tensor var_314_cast_fp16 = softmax(axis = var_112, x = aw_5_cast_fp16)[name = tensor("op_314_cast_fp16")]; + tensor var_315_cast_fp16 = softmax(axis = var_112, x = aw_7_cast_fp16)[name = tensor("op_315_cast_fp16")]; + tensor var_316_cast_fp16 = softmax(axis = var_112, x = aw_9_cast_fp16)[name = tensor("op_316_cast_fp16")]; + tensor var_318_equation_0 = const()[name = tensor("op_318_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_318_cast_fp16 = einsum(equation = var_318_equation_0, values = (var_273_cast_fp16, var_312_cast_fp16))[name = tensor("op_318_cast_fp16")]; + tensor var_320_equation_0 = const()[name = tensor("op_320_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_320_cast_fp16 = einsum(equation = var_320_equation_0, values = (var_277_cast_fp16, var_313_cast_fp16))[name = tensor("op_320_cast_fp16")]; + tensor var_322_equation_0 = const()[name = tensor("op_322_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_322_cast_fp16 = einsum(equation = var_322_equation_0, values = (var_281_cast_fp16, var_314_cast_fp16))[name = tensor("op_322_cast_fp16")]; + tensor var_324_equation_0 = const()[name = tensor("op_324_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_324_cast_fp16 = einsum(equation = var_324_equation_0, values = (var_285_cast_fp16, var_315_cast_fp16))[name = tensor("op_324_cast_fp16")]; + tensor var_326_equation_0 = const()[name = tensor("op_326_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_326_cast_fp16 = einsum(equation = var_326_equation_0, values = (var_289_cast_fp16, var_316_cast_fp16))[name = tensor("op_326_cast_fp16")]; + tensor input_25_interleave_0 = const()[name = tensor("input_25_interleave_0"), val = tensor(false)]; + tensor input_25_cast_fp16 = concat(axis = var_112, interleave = input_25_interleave_0, values = (var_318_cast_fp16, var_320_cast_fp16, var_322_cast_fp16, var_324_cast_fp16, var_326_cast_fp16))[name = tensor("input_25_cast_fp16")]; + tensor var_332 = const()[name = tensor("op_332"), val = tensor([1, 1])]; + tensor var_334 = const()[name = tensor("op_334"), val = tensor([1, 1])]; + tensor var_336_pad_type_0 = const()[name = tensor("op_336_pad_type_0"), val = tensor("custom")]; + tensor var_336_pad_0 = const()[name = tensor("op_336_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9460736)))]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9665600)))]; + tensor var_336_cast_fp16 = conv(bias = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_334, groups = var_112, pad = var_336_pad_0, pad_type = var_336_pad_type_0, strides = var_332, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_25_cast_fp16)[name = tensor("op_336_cast_fp16")]; + tensor inputs_3_cast_fp16 = add(x = var_336_cast_fp16, y = inputs_1_cast_fp16)[name = tensor("inputs_3_cast_fp16")]; + tensor var_340 = const()[name = tensor("op_340"), val = tensor([1])]; + tensor channels_mean_3_cast_fp16 = reduce_mean(axes = var_340, keep_dims = var_107, x = inputs_3_cast_fp16)[name = tensor("channels_mean_3_cast_fp16")]; + tensor zero_mean_3_cast_fp16 = sub(x = inputs_3_cast_fp16, y = channels_mean_3_cast_fp16)[name = tensor("zero_mean_3_cast_fp16")]; + tensor zero_mean_sq_3_cast_fp16 = mul(x = zero_mean_3_cast_fp16, y = zero_mean_3_cast_fp16)[name = tensor("zero_mean_sq_3_cast_fp16")]; + tensor var_344 = const()[name = tensor("op_344"), val = tensor([1])]; + tensor var_345_cast_fp16 = reduce_mean(axes = var_344, keep_dims = var_107, x = zero_mean_sq_3_cast_fp16)[name = tensor("op_345_cast_fp16")]; + tensor var_346_to_fp16 = const()[name = tensor("op_346_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_347_cast_fp16 = add(x = var_345_cast_fp16, y = var_346_to_fp16)[name = tensor("op_347_cast_fp16")]; + tensor denom_3_epsilon_0_to_fp16 = const()[name = tensor("denom_3_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_3_cast_fp16 = rsqrt(epsilon = denom_3_epsilon_0_to_fp16, x = var_347_cast_fp16)[name = tensor("denom_3_cast_fp16")]; + tensor out_3_cast_fp16 = mul(x = zero_mean_3_cast_fp16, y = denom_3_cast_fp16)[name = tensor("out_3_cast_fp16")]; + tensor var_351_to_fp16 = const()[name = tensor("op_351_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9666304)))]; + tensor var_352_cast_fp16 = add(x = out_3_cast_fp16, y = var_351_to_fp16)[name = tensor("op_352_cast_fp16")]; + tensor var_354_to_fp16 = const()[name = tensor("op_354_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9667008)))]; + tensor hidden_states_11_cast_fp16 = mul(x = var_352_cast_fp16, y = var_354_to_fp16)[name = tensor("hidden_states_11_cast_fp16")]; + tensor var_361 = const()[name = tensor("op_361"), val = tensor([1, 1])]; + tensor var_363 = const()[name = tensor("op_363"), val = tensor([1, 1])]; + tensor q_3_pad_type_0 = const()[name = tensor("q_3_pad_type_0"), val = tensor("custom")]; + tensor q_3_pad_0 = const()[name = tensor("q_3_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9667712)))]; + tensor q_3_cast_fp16 = conv(dilations = var_363, groups = var_112, pad = q_3_pad_0, pad_type = q_3_pad_type_0, strides = var_361, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor("q_3_cast_fp16")]; + tensor var_367 = const()[name = tensor("op_367"), val = tensor([1, 1])]; + tensor var_369 = const()[name = tensor("op_369"), val = tensor([1, 1])]; + tensor k_5_pad_type_0 = const()[name = tensor("k_5_pad_type_0"), val = tensor("custom")]; + tensor k_5_pad_0 = const()[name = tensor("k_5_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9872576)))]; + tensor k_5_cast_fp16 = conv(dilations = var_369, groups = var_112, pad = k_5_pad_0, pad_type = k_5_pad_type_0, strides = var_367, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_5_cast_fp16")]; + tensor var_373 = const()[name = tensor("op_373"), val = tensor([1, 1])]; + tensor var_375 = const()[name = tensor("op_375"), val = tensor([1, 1])]; + tensor v_3_pad_type_0 = const()[name = tensor("v_3_pad_type_0"), val = tensor("custom")]; + tensor v_3_pad_0 = const()[name = tensor("v_3_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10528000)))]; + tensor v_3_cast_fp16 = conv(dilations = var_375, groups = var_112, pad = v_3_pad_0, pad_type = v_3_pad_type_0, strides = var_373, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_3_cast_fp16")]; + tensor var_379_begin_0 = const()[name = tensor("op_379_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_379_end_0 = const()[name = tensor("op_379_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_379_end_mask_0 = const()[name = tensor("op_379_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_379_cast_fp16 = slice_by_index(begin = var_379_begin_0, end = var_379_end_0, end_mask = var_379_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_379_cast_fp16")]; + tensor var_383_begin_0 = const()[name = tensor("op_383_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_383_end_0 = const()[name = tensor("op_383_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_383_end_mask_0 = const()[name = tensor("op_383_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_383_cast_fp16 = slice_by_index(begin = var_383_begin_0, end = var_383_end_0, end_mask = var_383_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_383_cast_fp16")]; + tensor var_387_begin_0 = const()[name = tensor("op_387_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_387_end_0 = const()[name = tensor("op_387_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_387_end_mask_0 = const()[name = tensor("op_387_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_387_cast_fp16 = slice_by_index(begin = var_387_begin_0, end = var_387_end_0, end_mask = var_387_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_387_cast_fp16")]; + tensor var_391_begin_0 = const()[name = tensor("op_391_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_391_end_0 = const()[name = tensor("op_391_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_391_end_mask_0 = const()[name = tensor("op_391_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_391_cast_fp16 = slice_by_index(begin = var_391_begin_0, end = var_391_end_0, end_mask = var_391_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_391_cast_fp16")]; + tensor var_395_begin_0 = const()[name = tensor("op_395_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_395_end_0 = const()[name = tensor("op_395_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_395_end_mask_0 = const()[name = tensor("op_395_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_395_cast_fp16 = slice_by_index(begin = var_395_begin_0, end = var_395_end_0, end_mask = var_395_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_395_cast_fp16")]; + tensor k_7_perm_0 = const()[name = tensor("k_7_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_402_begin_0 = const()[name = tensor("op_402_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_402_end_0 = const()[name = tensor("op_402_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_402_end_mask_0 = const()[name = tensor("op_402_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_30 = transpose(perm = k_7_perm_0, x = k_5_cast_fp16)[name = tensor("transpose_30")]; + tensor var_402_cast_fp16 = slice_by_index(begin = var_402_begin_0, end = var_402_end_0, end_mask = var_402_end_mask_0, x = transpose_30)[name = tensor("op_402_cast_fp16")]; + tensor var_406_begin_0 = const()[name = tensor("op_406_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_406_end_0 = const()[name = tensor("op_406_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_406_end_mask_0 = const()[name = tensor("op_406_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_406_cast_fp16 = slice_by_index(begin = var_406_begin_0, end = var_406_end_0, end_mask = var_406_end_mask_0, x = transpose_30)[name = tensor("op_406_cast_fp16")]; + tensor var_410_begin_0 = const()[name = tensor("op_410_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_410_end_0 = const()[name = tensor("op_410_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_410_end_mask_0 = const()[name = tensor("op_410_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_410_cast_fp16 = slice_by_index(begin = var_410_begin_0, end = var_410_end_0, end_mask = var_410_end_mask_0, x = transpose_30)[name = tensor("op_410_cast_fp16")]; + tensor var_414_begin_0 = const()[name = tensor("op_414_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_414_end_0 = const()[name = tensor("op_414_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_414_end_mask_0 = const()[name = tensor("op_414_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_414_cast_fp16 = slice_by_index(begin = var_414_begin_0, end = var_414_end_0, end_mask = var_414_end_mask_0, x = transpose_30)[name = tensor("op_414_cast_fp16")]; + tensor var_418_begin_0 = const()[name = tensor("op_418_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_418_end_0 = const()[name = tensor("op_418_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_418_end_mask_0 = const()[name = tensor("op_418_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_418_cast_fp16 = slice_by_index(begin = var_418_begin_0, end = var_418_end_0, end_mask = var_418_end_mask_0, x = transpose_30)[name = tensor("op_418_cast_fp16")]; + tensor var_420_begin_0 = const()[name = tensor("op_420_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_420_end_0 = const()[name = tensor("op_420_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_420_end_mask_0 = const()[name = tensor("op_420_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_420_cast_fp16 = slice_by_index(begin = var_420_begin_0, end = var_420_end_0, end_mask = var_420_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_420_cast_fp16")]; + tensor var_424_begin_0 = const()[name = tensor("op_424_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_424_end_0 = const()[name = tensor("op_424_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_424_end_mask_0 = const()[name = tensor("op_424_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_424_cast_fp16 = slice_by_index(begin = var_424_begin_0, end = var_424_end_0, end_mask = var_424_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_424_cast_fp16")]; + tensor var_428_begin_0 = const()[name = tensor("op_428_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_428_end_0 = const()[name = tensor("op_428_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_428_end_mask_0 = const()[name = tensor("op_428_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_428_cast_fp16 = slice_by_index(begin = var_428_begin_0, end = var_428_end_0, end_mask = var_428_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_428_cast_fp16")]; + tensor var_432_begin_0 = const()[name = tensor("op_432_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_432_end_0 = const()[name = tensor("op_432_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_432_end_mask_0 = const()[name = tensor("op_432_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_432_cast_fp16 = slice_by_index(begin = var_432_begin_0, end = var_432_end_0, end_mask = var_432_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_432_cast_fp16")]; + tensor var_436_begin_0 = const()[name = tensor("op_436_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_436_end_0 = const()[name = tensor("op_436_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_436_end_mask_0 = const()[name = tensor("op_436_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_436_cast_fp16 = slice_by_index(begin = var_436_begin_0, end = var_436_end_0, end_mask = var_436_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_436_cast_fp16")]; + tensor var_440_equation_0 = const()[name = tensor("op_440_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_440_cast_fp16 = einsum(equation = var_440_equation_0, values = (var_402_cast_fp16, var_379_cast_fp16))[name = tensor("op_440_cast_fp16")]; + tensor var_441_to_fp16 = const()[name = tensor("op_441_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_11_cast_fp16 = mul(x = var_440_cast_fp16, y = var_441_to_fp16)[name = tensor("aw_11_cast_fp16")]; + tensor var_444_equation_0 = const()[name = tensor("op_444_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_444_cast_fp16 = einsum(equation = var_444_equation_0, values = (var_406_cast_fp16, var_383_cast_fp16))[name = tensor("op_444_cast_fp16")]; + tensor var_445_to_fp16 = const()[name = tensor("op_445_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_13_cast_fp16 = mul(x = var_444_cast_fp16, y = var_445_to_fp16)[name = tensor("aw_13_cast_fp16")]; + tensor var_448_equation_0 = const()[name = tensor("op_448_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_448_cast_fp16 = einsum(equation = var_448_equation_0, values = (var_410_cast_fp16, var_387_cast_fp16))[name = tensor("op_448_cast_fp16")]; + tensor var_449_to_fp16 = const()[name = tensor("op_449_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_15_cast_fp16 = mul(x = var_448_cast_fp16, y = var_449_to_fp16)[name = tensor("aw_15_cast_fp16")]; + tensor var_452_equation_0 = const()[name = tensor("op_452_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_452_cast_fp16 = einsum(equation = var_452_equation_0, values = (var_414_cast_fp16, var_391_cast_fp16))[name = tensor("op_452_cast_fp16")]; + tensor var_453_to_fp16 = const()[name = tensor("op_453_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_17_cast_fp16 = mul(x = var_452_cast_fp16, y = var_453_to_fp16)[name = tensor("aw_17_cast_fp16")]; + tensor var_456_equation_0 = const()[name = tensor("op_456_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_456_cast_fp16 = einsum(equation = var_456_equation_0, values = (var_418_cast_fp16, var_395_cast_fp16))[name = tensor("op_456_cast_fp16")]; + tensor var_457_to_fp16 = const()[name = tensor("op_457_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_19_cast_fp16 = mul(x = var_456_cast_fp16, y = var_457_to_fp16)[name = tensor("aw_19_cast_fp16")]; + tensor var_459_cast_fp16 = softmax(axis = var_112, x = aw_11_cast_fp16)[name = tensor("op_459_cast_fp16")]; + tensor var_460_cast_fp16 = softmax(axis = var_112, x = aw_13_cast_fp16)[name = tensor("op_460_cast_fp16")]; + tensor var_461_cast_fp16 = softmax(axis = var_112, x = aw_15_cast_fp16)[name = tensor("op_461_cast_fp16")]; + tensor var_462_cast_fp16 = softmax(axis = var_112, x = aw_17_cast_fp16)[name = tensor("op_462_cast_fp16")]; + tensor var_463_cast_fp16 = softmax(axis = var_112, x = aw_19_cast_fp16)[name = tensor("op_463_cast_fp16")]; + tensor var_465_equation_0 = const()[name = tensor("op_465_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_465_cast_fp16 = einsum(equation = var_465_equation_0, values = (var_420_cast_fp16, var_459_cast_fp16))[name = tensor("op_465_cast_fp16")]; + tensor var_467_equation_0 = const()[name = tensor("op_467_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_467_cast_fp16 = einsum(equation = var_467_equation_0, values = (var_424_cast_fp16, var_460_cast_fp16))[name = tensor("op_467_cast_fp16")]; + tensor var_469_equation_0 = const()[name = tensor("op_469_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_469_cast_fp16 = einsum(equation = var_469_equation_0, values = (var_428_cast_fp16, var_461_cast_fp16))[name = tensor("op_469_cast_fp16")]; + tensor var_471_equation_0 = const()[name = tensor("op_471_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_471_cast_fp16 = einsum(equation = var_471_equation_0, values = (var_432_cast_fp16, var_462_cast_fp16))[name = tensor("op_471_cast_fp16")]; + tensor var_473_equation_0 = const()[name = tensor("op_473_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_473_cast_fp16 = einsum(equation = var_473_equation_0, values = (var_436_cast_fp16, var_463_cast_fp16))[name = tensor("op_473_cast_fp16")]; + tensor input_27_interleave_0 = const()[name = tensor("input_27_interleave_0"), val = tensor(false)]; + tensor input_27_cast_fp16 = concat(axis = var_112, interleave = input_27_interleave_0, values = (var_465_cast_fp16, var_467_cast_fp16, var_469_cast_fp16, var_471_cast_fp16, var_473_cast_fp16))[name = tensor("input_27_cast_fp16")]; + tensor var_479 = const()[name = tensor("op_479"), val = tensor([1, 1])]; + tensor var_481 = const()[name = tensor("op_481"), val = tensor([1, 1])]; + tensor var_483_pad_type_0 = const()[name = tensor("op_483_pad_type_0"), val = tensor("custom")]; + tensor var_483_pad_0 = const()[name = tensor("op_483_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11183424)))]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11388288)))]; + tensor var_483_cast_fp16 = conv(bias = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_481, groups = var_112, pad = var_483_pad_0, pad_type = var_483_pad_type_0, strides = var_479, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("op_483_cast_fp16")]; + tensor inputs_5_cast_fp16 = add(x = var_483_cast_fp16, y = inputs_3_cast_fp16)[name = tensor("inputs_5_cast_fp16")]; + tensor var_487 = const()[name = tensor("op_487"), val = tensor([1])]; + tensor channels_mean_5_cast_fp16 = reduce_mean(axes = var_487, keep_dims = var_107, x = inputs_5_cast_fp16)[name = tensor("channels_mean_5_cast_fp16")]; + tensor zero_mean_5_cast_fp16 = sub(x = inputs_5_cast_fp16, y = channels_mean_5_cast_fp16)[name = tensor("zero_mean_5_cast_fp16")]; + tensor zero_mean_sq_5_cast_fp16 = mul(x = zero_mean_5_cast_fp16, y = zero_mean_5_cast_fp16)[name = tensor("zero_mean_sq_5_cast_fp16")]; + tensor var_491 = const()[name = tensor("op_491"), val = tensor([1])]; + tensor var_492_cast_fp16 = reduce_mean(axes = var_491, keep_dims = var_107, x = zero_mean_sq_5_cast_fp16)[name = tensor("op_492_cast_fp16")]; + tensor var_493_to_fp16 = const()[name = tensor("op_493_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_494_cast_fp16 = add(x = var_492_cast_fp16, y = var_493_to_fp16)[name = tensor("op_494_cast_fp16")]; + tensor denom_5_epsilon_0_to_fp16 = const()[name = tensor("denom_5_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_5_cast_fp16 = rsqrt(epsilon = denom_5_epsilon_0_to_fp16, x = var_494_cast_fp16)[name = tensor("denom_5_cast_fp16")]; + tensor out_5_cast_fp16 = mul(x = zero_mean_5_cast_fp16, y = denom_5_cast_fp16)[name = tensor("out_5_cast_fp16")]; + tensor var_498_to_fp16 = const()[name = tensor("op_498_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11388992)))]; + tensor var_499_cast_fp16 = add(x = out_5_cast_fp16, y = var_498_to_fp16)[name = tensor("op_499_cast_fp16")]; + tensor var_501_to_fp16 = const()[name = tensor("op_501_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11389696)))]; + tensor input_29_cast_fp16 = mul(x = var_499_cast_fp16, y = var_501_to_fp16)[name = tensor("input_29_cast_fp16")]; + tensor var_509 = const()[name = tensor("op_509"), val = tensor([1, 1])]; + tensor var_511 = const()[name = tensor("op_511"), val = tensor([1, 1])]; + tensor var_513_pad_type_0 = const()[name = tensor("op_513_pad_type_0"), val = tensor("custom")]; + tensor var_513_pad_0 = const()[name = tensor("op_513_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11390400)))]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13028864)))]; + tensor var_513_cast_fp16 = conv(bias = down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_511, groups = var_112, pad = var_513_pad_0, pad_type = var_513_pad_type_0, strides = var_509, weight = down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_29_cast_fp16)[name = tensor("op_513_cast_fp16")]; + tensor var_514_split_sizes_0 = const()[name = tensor("op_514_split_sizes_0"), val = tensor([1280, 1280])]; + tensor var_514_axis_0 = const()[name = tensor("op_514_axis_0"), val = tensor(1)]; + tensor var_514_cast_fp16_0, tensor var_514_cast_fp16_1 = split(axis = var_514_axis_0, split_sizes = var_514_split_sizes_0, x = var_513_cast_fp16)[name = tensor("op_514_cast_fp16")]; + tensor var_516_mode_0 = const()[name = tensor("op_516_mode_0"), val = tensor("EXACT")]; + tensor var_516_cast_fp16 = gelu(mode = var_516_mode_0, x = var_514_cast_fp16_1)[name = tensor("op_516_cast_fp16")]; + tensor input_31_cast_fp16 = mul(x = var_514_cast_fp16_0, y = var_516_cast_fp16)[name = tensor("input_31_cast_fp16")]; + tensor var_520 = const()[name = tensor("op_520"), val = tensor([1, 1])]; + tensor var_522 = const()[name = tensor("op_522"), val = tensor([1, 1])]; + tensor var_524_pad_type_0 = const()[name = tensor("op_524_pad_type_0"), val = tensor("custom")]; + tensor var_524_pad_0 = const()[name = tensor("op_524_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13034048)))]; + tensor down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13853312)))]; + tensor var_524_cast_fp16 = conv(bias = down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_522, groups = var_112, pad = var_524_pad_0, pad_type = var_524_pad_type_0, strides = var_520, weight = down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_31_cast_fp16)[name = tensor("op_524_cast_fp16")]; + tensor hidden_states_15_cast_fp16 = add(x = var_524_cast_fp16, y = inputs_5_cast_fp16)[name = tensor("hidden_states_15_cast_fp16")]; + tensor var_526 = const()[name = tensor("op_526"), val = tensor([2, 320, 48, 48])]; + tensor input_33_cast_fp16 = reshape(shape = var_526, x = hidden_states_15_cast_fp16)[name = tensor("input_33_cast_fp16")]; + tensor var_530 = const()[name = tensor("op_530"), val = tensor([1, 1])]; + tensor var_532 = const()[name = tensor("op_532"), val = tensor([1, 1])]; + tensor hidden_states_17_pad_type_0 = const()[name = tensor("hidden_states_17_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_17_pad_0 = const()[name = tensor("hidden_states_17_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13854016)))]; + tensor down_blocks_0_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14058880)))]; + tensor hidden_states_17_cast_fp16 = conv(bias = down_blocks_0_attentions_0_proj_out_bias_to_fp16, dilations = var_532, groups = var_112, pad = hidden_states_17_pad_0, pad_type = hidden_states_17_pad_type_0, strides = var_530, weight = down_blocks_0_attentions_0_proj_out_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("hidden_states_17_cast_fp16")]; + tensor input_35_cast_fp16 = add(x = hidden_states_17_cast_fp16, y = hidden_states_5_cast_fp16)[name = tensor("input_35_cast_fp16")]; + tensor reshape_12_shape_0 = const()[name = tensor("reshape_12_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_12_cast_fp16 = reshape(shape = reshape_12_shape_0, x = input_35_cast_fp16)[name = tensor("reshape_12_cast_fp16")]; + tensor reduce_mean_9_axes_0 = const()[name = tensor("reduce_mean_9_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_9_keep_dims_0 = const()[name = tensor("reduce_mean_9_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_9_cast_fp16 = reduce_mean(axes = reduce_mean_9_axes_0, keep_dims = reduce_mean_9_keep_dims_0, x = reshape_12_cast_fp16)[name = tensor("reduce_mean_9_cast_fp16")]; + tensor sub_6_cast_fp16 = sub(x = reshape_12_cast_fp16, y = reduce_mean_9_cast_fp16)[name = tensor("sub_6_cast_fp16")]; + tensor square_3_cast_fp16 = square(x = sub_6_cast_fp16)[name = tensor("square_3_cast_fp16")]; + tensor reduce_mean_11_axes_0 = const()[name = tensor("reduce_mean_11_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_11_keep_dims_0 = const()[name = tensor("reduce_mean_11_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_11_cast_fp16 = reduce_mean(axes = reduce_mean_11_axes_0, keep_dims = reduce_mean_11_keep_dims_0, x = square_3_cast_fp16)[name = tensor("reduce_mean_11_cast_fp16")]; + tensor add_6_y_0_to_fp16 = const()[name = tensor("add_6_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_6_cast_fp16 = add(x = reduce_mean_11_cast_fp16, y = add_6_y_0_to_fp16)[name = tensor("add_6_cast_fp16")]; + tensor sqrt_3_cast_fp16 = sqrt(x = add_6_cast_fp16)[name = tensor("sqrt_3_cast_fp16")]; + tensor real_div_3_cast_fp16 = real_div(x = sub_6_cast_fp16, y = sqrt_3_cast_fp16)[name = tensor("real_div_3_cast_fp16")]; + tensor reshape_13_shape_0 = const()[name = tensor("reshape_13_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_13_cast_fp16 = reshape(shape = reshape_13_shape_0, x = real_div_3_cast_fp16)[name = tensor("reshape_13_cast_fp16")]; + tensor add_7_gamma_0_to_fp16 = const()[name = tensor("add_7_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14059584)))]; + tensor add_7_beta_0_to_fp16 = const()[name = tensor("add_7_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14060288)))]; + tensor add_7_epsilon_0_to_fp16 = const()[name = tensor("add_7_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_7_cast_fp16 = batch_norm(beta = add_7_beta_0_to_fp16, epsilon = add_7_epsilon_0_to_fp16, gamma = add_7_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_13_cast_fp16)[name = tensor("add_7_cast_fp16")]; + tensor input_39_cast_fp16 = silu(x = add_7_cast_fp16)[name = tensor("input_39_cast_fp16")]; + tensor var_547 = const()[name = tensor("op_547"), val = tensor([1, 1])]; + tensor var_549 = const()[name = tensor("op_549"), val = tensor([1, 1])]; + tensor hidden_states_19_pad_type_0 = const()[name = tensor("hidden_states_19_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_19_pad_0 = const()[name = tensor("hidden_states_19_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_0_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14060992)))]; + tensor down_blocks_0_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15904256)))]; + tensor hidden_states_19_cast_fp16 = conv(bias = down_blocks_0_resnets_1_conv1_bias_to_fp16, dilations = var_549, groups = var_112, pad = hidden_states_19_pad_0, pad_type = hidden_states_19_pad_type_0, strides = var_547, weight = down_blocks_0_resnets_1_conv1_weight_to_fp16, x = input_39_cast_fp16)[name = tensor("hidden_states_19_cast_fp16")]; + tensor var_555 = const()[name = tensor("op_555"), val = tensor([1, 1])]; + tensor var_557 = const()[name = tensor("op_557"), val = tensor([1, 1])]; + tensor temb_3_pad_type_0 = const()[name = tensor("temb_3_pad_type_0"), val = tensor("custom")]; + tensor temb_3_pad_0 = const()[name = tensor("temb_3_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15904960)))]; + tensor down_blocks_0_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16724224)))]; + tensor temb_3_cast_fp16 = conv(bias = down_blocks_0_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_557, groups = var_112, pad = temb_3_pad_0, pad_type = temb_3_pad_type_0, strides = var_555, weight = down_blocks_0_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_3_cast_fp16")]; + tensor input_43_cast_fp16 = add(x = hidden_states_19_cast_fp16, y = temb_3_cast_fp16)[name = tensor("input_43_cast_fp16")]; + tensor reshape_16_shape_0 = const()[name = tensor("reshape_16_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_16_cast_fp16 = reshape(shape = reshape_16_shape_0, x = input_43_cast_fp16)[name = tensor("reshape_16_cast_fp16")]; + tensor reduce_mean_12_axes_0 = const()[name = tensor("reduce_mean_12_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_12_keep_dims_0 = const()[name = tensor("reduce_mean_12_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_12_cast_fp16 = reduce_mean(axes = reduce_mean_12_axes_0, keep_dims = reduce_mean_12_keep_dims_0, x = reshape_16_cast_fp16)[name = tensor("reduce_mean_12_cast_fp16")]; + tensor sub_8_cast_fp16 = sub(x = reshape_16_cast_fp16, y = reduce_mean_12_cast_fp16)[name = tensor("sub_8_cast_fp16")]; + tensor square_4_cast_fp16 = square(x = sub_8_cast_fp16)[name = tensor("square_4_cast_fp16")]; + tensor reduce_mean_14_axes_0 = const()[name = tensor("reduce_mean_14_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_14_keep_dims_0 = const()[name = tensor("reduce_mean_14_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_14_cast_fp16 = reduce_mean(axes = reduce_mean_14_axes_0, keep_dims = reduce_mean_14_keep_dims_0, x = square_4_cast_fp16)[name = tensor("reduce_mean_14_cast_fp16")]; + tensor add_8_y_0_to_fp16 = const()[name = tensor("add_8_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_8_cast_fp16 = add(x = reduce_mean_14_cast_fp16, y = add_8_y_0_to_fp16)[name = tensor("add_8_cast_fp16")]; + tensor sqrt_4_cast_fp16 = sqrt(x = add_8_cast_fp16)[name = tensor("sqrt_4_cast_fp16")]; + tensor real_div_4_cast_fp16 = real_div(x = sub_8_cast_fp16, y = sqrt_4_cast_fp16)[name = tensor("real_div_4_cast_fp16")]; + tensor reshape_17_shape_0 = const()[name = tensor("reshape_17_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_17_cast_fp16 = reshape(shape = reshape_17_shape_0, x = real_div_4_cast_fp16)[name = tensor("reshape_17_cast_fp16")]; + tensor add_9_gamma_0_to_fp16 = const()[name = tensor("add_9_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16724928)))]; + tensor add_9_beta_0_to_fp16 = const()[name = tensor("add_9_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16725632)))]; + tensor add_9_epsilon_0_to_fp16 = const()[name = tensor("add_9_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_9_cast_fp16 = batch_norm(beta = add_9_beta_0_to_fp16, epsilon = add_9_epsilon_0_to_fp16, gamma = add_9_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_17_cast_fp16)[name = tensor("add_9_cast_fp16")]; + tensor input_47_cast_fp16 = silu(x = add_9_cast_fp16)[name = tensor("input_47_cast_fp16")]; + tensor var_567 = const()[name = tensor("op_567"), val = tensor([1, 1])]; + tensor var_569 = const()[name = tensor("op_569"), val = tensor([1, 1])]; + tensor hidden_states_21_pad_type_0 = const()[name = tensor("hidden_states_21_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_21_pad_0 = const()[name = tensor("hidden_states_21_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_0_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16726336)))]; + tensor down_blocks_0_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18569600)))]; + tensor hidden_states_21_cast_fp16 = conv(bias = down_blocks_0_resnets_1_conv2_bias_to_fp16, dilations = var_569, groups = var_112, pad = hidden_states_21_pad_0, pad_type = hidden_states_21_pad_type_0, strides = var_567, weight = down_blocks_0_resnets_1_conv2_weight_to_fp16, x = input_47_cast_fp16)[name = tensor("hidden_states_21_cast_fp16")]; + tensor hidden_states_23_cast_fp16 = add(x = input_35_cast_fp16, y = hidden_states_21_cast_fp16)[name = tensor("hidden_states_23_cast_fp16")]; + tensor reshape_20_shape_0 = const()[name = tensor("reshape_20_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_20_cast_fp16 = reshape(shape = reshape_20_shape_0, x = hidden_states_23_cast_fp16)[name = tensor("reshape_20_cast_fp16")]; + tensor reduce_mean_15_axes_0 = const()[name = tensor("reduce_mean_15_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_15_keep_dims_0 = const()[name = tensor("reduce_mean_15_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_15_cast_fp16 = reduce_mean(axes = reduce_mean_15_axes_0, keep_dims = reduce_mean_15_keep_dims_0, x = reshape_20_cast_fp16)[name = tensor("reduce_mean_15_cast_fp16")]; + tensor sub_10_cast_fp16 = sub(x = reshape_20_cast_fp16, y = reduce_mean_15_cast_fp16)[name = tensor("sub_10_cast_fp16")]; + tensor square_5_cast_fp16 = square(x = sub_10_cast_fp16)[name = tensor("square_5_cast_fp16")]; + tensor reduce_mean_17_axes_0 = const()[name = tensor("reduce_mean_17_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_17_keep_dims_0 = const()[name = tensor("reduce_mean_17_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_17_cast_fp16 = reduce_mean(axes = reduce_mean_17_axes_0, keep_dims = reduce_mean_17_keep_dims_0, x = square_5_cast_fp16)[name = tensor("reduce_mean_17_cast_fp16")]; + tensor add_10_y_0_to_fp16 = const()[name = tensor("add_10_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_10_cast_fp16 = add(x = reduce_mean_17_cast_fp16, y = add_10_y_0_to_fp16)[name = tensor("add_10_cast_fp16")]; + tensor sqrt_5_cast_fp16 = sqrt(x = add_10_cast_fp16)[name = tensor("sqrt_5_cast_fp16")]; + tensor real_div_5_cast_fp16 = real_div(x = sub_10_cast_fp16, y = sqrt_5_cast_fp16)[name = tensor("real_div_5_cast_fp16")]; + tensor reshape_21_shape_0 = const()[name = tensor("reshape_21_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_21_cast_fp16 = reshape(shape = reshape_21_shape_0, x = real_div_5_cast_fp16)[name = tensor("reshape_21_cast_fp16")]; + tensor add_11_gamma_0_to_fp16 = const()[name = tensor("add_11_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18570304)))]; + tensor add_11_beta_0_to_fp16 = const()[name = tensor("add_11_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18571008)))]; + tensor add_11_epsilon_0_to_fp16 = const()[name = tensor("add_11_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_11_cast_fp16 = batch_norm(beta = add_11_beta_0_to_fp16, epsilon = add_11_epsilon_0_to_fp16, gamma = add_11_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_21_cast_fp16)[name = tensor("add_11_cast_fp16")]; + tensor var_589 = const()[name = tensor("op_589"), val = tensor([1, 1])]; + tensor var_591 = const()[name = tensor("op_591"), val = tensor([1, 1])]; + tensor hidden_states_25_pad_type_0 = const()[name = tensor("hidden_states_25_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_25_pad_0 = const()[name = tensor("hidden_states_25_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18571712)))]; + tensor down_blocks_0_attentions_1_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18776576)))]; + tensor hidden_states_25_cast_fp16 = conv(bias = down_blocks_0_attentions_1_proj_in_bias_to_fp16, dilations = var_591, groups = var_112, pad = hidden_states_25_pad_0, pad_type = hidden_states_25_pad_type_0, strides = var_589, weight = down_blocks_0_attentions_1_proj_in_weight_to_fp16, x = add_11_cast_fp16)[name = tensor("hidden_states_25_cast_fp16")]; + tensor var_596 = const()[name = tensor("op_596"), val = tensor([2, 320, 1, 2304])]; + tensor inputs_7_cast_fp16 = reshape(shape = var_596, x = hidden_states_25_cast_fp16)[name = tensor("inputs_7_cast_fp16")]; + tensor var_606 = const()[name = tensor("op_606"), val = tensor([1])]; + tensor channels_mean_7_cast_fp16 = reduce_mean(axes = var_606, keep_dims = var_107, x = inputs_7_cast_fp16)[name = tensor("channels_mean_7_cast_fp16")]; + tensor zero_mean_7_cast_fp16 = sub(x = inputs_7_cast_fp16, y = channels_mean_7_cast_fp16)[name = tensor("zero_mean_7_cast_fp16")]; + tensor zero_mean_sq_7_cast_fp16 = mul(x = zero_mean_7_cast_fp16, y = zero_mean_7_cast_fp16)[name = tensor("zero_mean_sq_7_cast_fp16")]; + tensor var_610 = const()[name = tensor("op_610"), val = tensor([1])]; + tensor var_611_cast_fp16 = reduce_mean(axes = var_610, keep_dims = var_107, x = zero_mean_sq_7_cast_fp16)[name = tensor("op_611_cast_fp16")]; + tensor var_612_to_fp16 = const()[name = tensor("op_612_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_613_cast_fp16 = add(x = var_611_cast_fp16, y = var_612_to_fp16)[name = tensor("op_613_cast_fp16")]; + tensor denom_7_epsilon_0_to_fp16 = const()[name = tensor("denom_7_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_7_cast_fp16 = rsqrt(epsilon = denom_7_epsilon_0_to_fp16, x = var_613_cast_fp16)[name = tensor("denom_7_cast_fp16")]; + tensor out_7_cast_fp16 = mul(x = zero_mean_7_cast_fp16, y = denom_7_cast_fp16)[name = tensor("out_7_cast_fp16")]; + tensor var_617_to_fp16 = const()[name = tensor("op_617_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18777280)))]; + tensor var_618_cast_fp16 = add(x = out_7_cast_fp16, y = var_617_to_fp16)[name = tensor("op_618_cast_fp16")]; + tensor var_620_to_fp16 = const()[name = tensor("op_620_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18777984)))]; + tensor hidden_states_27_cast_fp16 = mul(x = var_618_cast_fp16, y = var_620_to_fp16)[name = tensor("hidden_states_27_cast_fp16")]; + tensor var_627 = const()[name = tensor("op_627"), val = tensor([1, 1])]; + tensor var_629 = const()[name = tensor("op_629"), val = tensor([1, 1])]; + tensor q_5_pad_type_0 = const()[name = tensor("q_5_pad_type_0"), val = tensor("custom")]; + tensor q_5_pad_0 = const()[name = tensor("q_5_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18778688)))]; + tensor q_5_cast_fp16 = conv(dilations = var_629, groups = var_112, pad = q_5_pad_0, pad_type = q_5_pad_type_0, strides = var_627, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor("q_5_cast_fp16")]; + tensor var_633 = const()[name = tensor("op_633"), val = tensor([1, 1])]; + tensor var_635 = const()[name = tensor("op_635"), val = tensor([1, 1])]; + tensor k_9_pad_type_0 = const()[name = tensor("k_9_pad_type_0"), val = tensor("custom")]; + tensor k_9_pad_0 = const()[name = tensor("k_9_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18983552)))]; + tensor k_9_cast_fp16 = conv(dilations = var_635, groups = var_112, pad = k_9_pad_0, pad_type = k_9_pad_type_0, strides = var_633, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor("k_9_cast_fp16")]; + tensor var_639 = const()[name = tensor("op_639"), val = tensor([1, 1])]; + tensor var_641 = const()[name = tensor("op_641"), val = tensor([1, 1])]; + tensor v_5_pad_type_0 = const()[name = tensor("v_5_pad_type_0"), val = tensor("custom")]; + tensor v_5_pad_0 = const()[name = tensor("v_5_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19188416)))]; + tensor v_5_cast_fp16 = conv(dilations = var_641, groups = var_112, pad = v_5_pad_0, pad_type = v_5_pad_type_0, strides = var_639, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor("v_5_cast_fp16")]; + tensor var_645_begin_0 = const()[name = tensor("op_645_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_645_end_0 = const()[name = tensor("op_645_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_645_end_mask_0 = const()[name = tensor("op_645_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_645_cast_fp16 = slice_by_index(begin = var_645_begin_0, end = var_645_end_0, end_mask = var_645_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_645_cast_fp16")]; + tensor var_649_begin_0 = const()[name = tensor("op_649_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_649_end_0 = const()[name = tensor("op_649_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_649_end_mask_0 = const()[name = tensor("op_649_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_649_cast_fp16 = slice_by_index(begin = var_649_begin_0, end = var_649_end_0, end_mask = var_649_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_649_cast_fp16")]; + tensor var_653_begin_0 = const()[name = tensor("op_653_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_653_end_0 = const()[name = tensor("op_653_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_653_end_mask_0 = const()[name = tensor("op_653_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_653_cast_fp16 = slice_by_index(begin = var_653_begin_0, end = var_653_end_0, end_mask = var_653_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_653_cast_fp16")]; + tensor var_657_begin_0 = const()[name = tensor("op_657_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_657_end_0 = const()[name = tensor("op_657_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_657_end_mask_0 = const()[name = tensor("op_657_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_657_cast_fp16 = slice_by_index(begin = var_657_begin_0, end = var_657_end_0, end_mask = var_657_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_657_cast_fp16")]; + tensor var_661_begin_0 = const()[name = tensor("op_661_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_661_end_0 = const()[name = tensor("op_661_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_661_end_mask_0 = const()[name = tensor("op_661_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_661_cast_fp16 = slice_by_index(begin = var_661_begin_0, end = var_661_end_0, end_mask = var_661_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_661_cast_fp16")]; + tensor k_11_perm_0 = const()[name = tensor("k_11_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_668_begin_0 = const()[name = tensor("op_668_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_668_end_0 = const()[name = tensor("op_668_end_0"), val = tensor([2, 2304, 1, 64])]; + tensor var_668_end_mask_0 = const()[name = tensor("op_668_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_29 = transpose(perm = k_11_perm_0, x = k_9_cast_fp16)[name = tensor("transpose_29")]; + tensor var_668_cast_fp16 = slice_by_index(begin = var_668_begin_0, end = var_668_end_0, end_mask = var_668_end_mask_0, x = transpose_29)[name = tensor("op_668_cast_fp16")]; + tensor var_672_begin_0 = const()[name = tensor("op_672_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_672_end_0 = const()[name = tensor("op_672_end_0"), val = tensor([2, 2304, 1, 128])]; + tensor var_672_end_mask_0 = const()[name = tensor("op_672_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_672_cast_fp16 = slice_by_index(begin = var_672_begin_0, end = var_672_end_0, end_mask = var_672_end_mask_0, x = transpose_29)[name = tensor("op_672_cast_fp16")]; + tensor var_676_begin_0 = const()[name = tensor("op_676_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_676_end_0 = const()[name = tensor("op_676_end_0"), val = tensor([2, 2304, 1, 192])]; + tensor var_676_end_mask_0 = const()[name = tensor("op_676_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_676_cast_fp16 = slice_by_index(begin = var_676_begin_0, end = var_676_end_0, end_mask = var_676_end_mask_0, x = transpose_29)[name = tensor("op_676_cast_fp16")]; + tensor var_680_begin_0 = const()[name = tensor("op_680_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_680_end_0 = const()[name = tensor("op_680_end_0"), val = tensor([2, 2304, 1, 256])]; + tensor var_680_end_mask_0 = const()[name = tensor("op_680_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_680_cast_fp16 = slice_by_index(begin = var_680_begin_0, end = var_680_end_0, end_mask = var_680_end_mask_0, x = transpose_29)[name = tensor("op_680_cast_fp16")]; + tensor var_684_begin_0 = const()[name = tensor("op_684_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_684_end_0 = const()[name = tensor("op_684_end_0"), val = tensor([2, 2304, 1, 320])]; + tensor var_684_end_mask_0 = const()[name = tensor("op_684_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_684_cast_fp16 = slice_by_index(begin = var_684_begin_0, end = var_684_end_0, end_mask = var_684_end_mask_0, x = transpose_29)[name = tensor("op_684_cast_fp16")]; + tensor var_686_begin_0 = const()[name = tensor("op_686_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_686_end_0 = const()[name = tensor("op_686_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_686_end_mask_0 = const()[name = tensor("op_686_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_686_cast_fp16 = slice_by_index(begin = var_686_begin_0, end = var_686_end_0, end_mask = var_686_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_686_cast_fp16")]; + tensor var_690_begin_0 = const()[name = tensor("op_690_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_690_end_0 = const()[name = tensor("op_690_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_690_end_mask_0 = const()[name = tensor("op_690_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_690_cast_fp16 = slice_by_index(begin = var_690_begin_0, end = var_690_end_0, end_mask = var_690_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_690_cast_fp16")]; + tensor var_694_begin_0 = const()[name = tensor("op_694_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_694_end_0 = const()[name = tensor("op_694_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_694_end_mask_0 = const()[name = tensor("op_694_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_694_cast_fp16 = slice_by_index(begin = var_694_begin_0, end = var_694_end_0, end_mask = var_694_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_694_cast_fp16")]; + tensor var_698_begin_0 = const()[name = tensor("op_698_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_698_end_0 = const()[name = tensor("op_698_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_698_end_mask_0 = const()[name = tensor("op_698_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_698_cast_fp16 = slice_by_index(begin = var_698_begin_0, end = var_698_end_0, end_mask = var_698_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_698_cast_fp16")]; + tensor var_702_begin_0 = const()[name = tensor("op_702_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_702_end_0 = const()[name = tensor("op_702_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_702_end_mask_0 = const()[name = tensor("op_702_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_702_cast_fp16 = slice_by_index(begin = var_702_begin_0, end = var_702_end_0, end_mask = var_702_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_702_cast_fp16")]; + tensor var_706_equation_0 = const()[name = tensor("op_706_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_706_cast_fp16 = einsum(equation = var_706_equation_0, values = (var_668_cast_fp16, var_645_cast_fp16))[name = tensor("op_706_cast_fp16")]; + tensor var_707_to_fp16 = const()[name = tensor("op_707_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_21_cast_fp16 = mul(x = var_706_cast_fp16, y = var_707_to_fp16)[name = tensor("aw_21_cast_fp16")]; + tensor var_710_equation_0 = const()[name = tensor("op_710_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_710_cast_fp16 = einsum(equation = var_710_equation_0, values = (var_672_cast_fp16, var_649_cast_fp16))[name = tensor("op_710_cast_fp16")]; + tensor var_711_to_fp16 = const()[name = tensor("op_711_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_23_cast_fp16 = mul(x = var_710_cast_fp16, y = var_711_to_fp16)[name = tensor("aw_23_cast_fp16")]; + tensor var_714_equation_0 = const()[name = tensor("op_714_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_714_cast_fp16 = einsum(equation = var_714_equation_0, values = (var_676_cast_fp16, var_653_cast_fp16))[name = tensor("op_714_cast_fp16")]; + tensor var_715_to_fp16 = const()[name = tensor("op_715_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_25_cast_fp16 = mul(x = var_714_cast_fp16, y = var_715_to_fp16)[name = tensor("aw_25_cast_fp16")]; + tensor var_718_equation_0 = const()[name = tensor("op_718_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_718_cast_fp16 = einsum(equation = var_718_equation_0, values = (var_680_cast_fp16, var_657_cast_fp16))[name = tensor("op_718_cast_fp16")]; + tensor var_719_to_fp16 = const()[name = tensor("op_719_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_27_cast_fp16 = mul(x = var_718_cast_fp16, y = var_719_to_fp16)[name = tensor("aw_27_cast_fp16")]; + tensor var_722_equation_0 = const()[name = tensor("op_722_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_722_cast_fp16 = einsum(equation = var_722_equation_0, values = (var_684_cast_fp16, var_661_cast_fp16))[name = tensor("op_722_cast_fp16")]; + tensor var_723_to_fp16 = const()[name = tensor("op_723_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_29_cast_fp16 = mul(x = var_722_cast_fp16, y = var_723_to_fp16)[name = tensor("aw_29_cast_fp16")]; + tensor var_725_cast_fp16 = softmax(axis = var_112, x = aw_21_cast_fp16)[name = tensor("op_725_cast_fp16")]; + tensor var_726_cast_fp16 = softmax(axis = var_112, x = aw_23_cast_fp16)[name = tensor("op_726_cast_fp16")]; + tensor var_727_cast_fp16 = softmax(axis = var_112, x = aw_25_cast_fp16)[name = tensor("op_727_cast_fp16")]; + tensor var_728_cast_fp16 = softmax(axis = var_112, x = aw_27_cast_fp16)[name = tensor("op_728_cast_fp16")]; + tensor var_729_cast_fp16 = softmax(axis = var_112, x = aw_29_cast_fp16)[name = tensor("op_729_cast_fp16")]; + tensor var_731_equation_0 = const()[name = tensor("op_731_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_731_cast_fp16 = einsum(equation = var_731_equation_0, values = (var_686_cast_fp16, var_725_cast_fp16))[name = tensor("op_731_cast_fp16")]; + tensor var_733_equation_0 = const()[name = tensor("op_733_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_733_cast_fp16 = einsum(equation = var_733_equation_0, values = (var_690_cast_fp16, var_726_cast_fp16))[name = tensor("op_733_cast_fp16")]; + tensor var_735_equation_0 = const()[name = tensor("op_735_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_735_cast_fp16 = einsum(equation = var_735_equation_0, values = (var_694_cast_fp16, var_727_cast_fp16))[name = tensor("op_735_cast_fp16")]; + tensor var_737_equation_0 = const()[name = tensor("op_737_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_737_cast_fp16 = einsum(equation = var_737_equation_0, values = (var_698_cast_fp16, var_728_cast_fp16))[name = tensor("op_737_cast_fp16")]; + tensor var_739_equation_0 = const()[name = tensor("op_739_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_739_cast_fp16 = einsum(equation = var_739_equation_0, values = (var_702_cast_fp16, var_729_cast_fp16))[name = tensor("op_739_cast_fp16")]; + tensor input_51_interleave_0 = const()[name = tensor("input_51_interleave_0"), val = tensor(false)]; + tensor input_51_cast_fp16 = concat(axis = var_112, interleave = input_51_interleave_0, values = (var_731_cast_fp16, var_733_cast_fp16, var_735_cast_fp16, var_737_cast_fp16, var_739_cast_fp16))[name = tensor("input_51_cast_fp16")]; + tensor var_745 = const()[name = tensor("op_745"), val = tensor([1, 1])]; + tensor var_747 = const()[name = tensor("op_747"), val = tensor([1, 1])]; + tensor var_749_pad_type_0 = const()[name = tensor("op_749_pad_type_0"), val = tensor("custom")]; + tensor var_749_pad_0 = const()[name = tensor("op_749_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19393280)))]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19598144)))]; + tensor var_749_cast_fp16 = conv(bias = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_747, groups = var_112, pad = var_749_pad_0, pad_type = var_749_pad_type_0, strides = var_745, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_51_cast_fp16)[name = tensor("op_749_cast_fp16")]; + tensor inputs_9_cast_fp16 = add(x = var_749_cast_fp16, y = inputs_7_cast_fp16)[name = tensor("inputs_9_cast_fp16")]; + tensor var_753 = const()[name = tensor("op_753"), val = tensor([1])]; + tensor channels_mean_9_cast_fp16 = reduce_mean(axes = var_753, keep_dims = var_107, x = inputs_9_cast_fp16)[name = tensor("channels_mean_9_cast_fp16")]; + tensor zero_mean_9_cast_fp16 = sub(x = inputs_9_cast_fp16, y = channels_mean_9_cast_fp16)[name = tensor("zero_mean_9_cast_fp16")]; + tensor zero_mean_sq_9_cast_fp16 = mul(x = zero_mean_9_cast_fp16, y = zero_mean_9_cast_fp16)[name = tensor("zero_mean_sq_9_cast_fp16")]; + tensor var_757 = const()[name = tensor("op_757"), val = tensor([1])]; + tensor var_758_cast_fp16 = reduce_mean(axes = var_757, keep_dims = var_107, x = zero_mean_sq_9_cast_fp16)[name = tensor("op_758_cast_fp16")]; + tensor var_759_to_fp16 = const()[name = tensor("op_759_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_760_cast_fp16 = add(x = var_758_cast_fp16, y = var_759_to_fp16)[name = tensor("op_760_cast_fp16")]; + tensor denom_9_epsilon_0_to_fp16 = const()[name = tensor("denom_9_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_9_cast_fp16 = rsqrt(epsilon = denom_9_epsilon_0_to_fp16, x = var_760_cast_fp16)[name = tensor("denom_9_cast_fp16")]; + tensor out_9_cast_fp16 = mul(x = zero_mean_9_cast_fp16, y = denom_9_cast_fp16)[name = tensor("out_9_cast_fp16")]; + tensor var_764_to_fp16 = const()[name = tensor("op_764_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19598848)))]; + tensor var_765_cast_fp16 = add(x = out_9_cast_fp16, y = var_764_to_fp16)[name = tensor("op_765_cast_fp16")]; + tensor var_767_to_fp16 = const()[name = tensor("op_767_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19599552)))]; + tensor hidden_states_29_cast_fp16 = mul(x = var_765_cast_fp16, y = var_767_to_fp16)[name = tensor("hidden_states_29_cast_fp16")]; + tensor var_774 = const()[name = tensor("op_774"), val = tensor([1, 1])]; + tensor var_776 = const()[name = tensor("op_776"), val = tensor([1, 1])]; + tensor q_7_pad_type_0 = const()[name = tensor("q_7_pad_type_0"), val = tensor("custom")]; + tensor q_7_pad_0 = const()[name = tensor("q_7_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19600256)))]; + tensor q_7_cast_fp16 = conv(dilations = var_776, groups = var_112, pad = q_7_pad_0, pad_type = q_7_pad_type_0, strides = var_774, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_29_cast_fp16)[name = tensor("q_7_cast_fp16")]; + tensor var_780 = const()[name = tensor("op_780"), val = tensor([1, 1])]; + tensor var_782 = const()[name = tensor("op_782"), val = tensor([1, 1])]; + tensor k_13_pad_type_0 = const()[name = tensor("k_13_pad_type_0"), val = tensor("custom")]; + tensor k_13_pad_0 = const()[name = tensor("k_13_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19805120)))]; + tensor k_13_cast_fp16 = conv(dilations = var_782, groups = var_112, pad = k_13_pad_0, pad_type = k_13_pad_type_0, strides = var_780, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_13_cast_fp16")]; + tensor var_786 = const()[name = tensor("op_786"), val = tensor([1, 1])]; + tensor var_788 = const()[name = tensor("op_788"), val = tensor([1, 1])]; + tensor v_7_pad_type_0 = const()[name = tensor("v_7_pad_type_0"), val = tensor("custom")]; + tensor v_7_pad_0 = const()[name = tensor("v_7_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20460544)))]; + tensor v_7_cast_fp16 = conv(dilations = var_788, groups = var_112, pad = v_7_pad_0, pad_type = v_7_pad_type_0, strides = var_786, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_7_cast_fp16")]; + tensor var_792_begin_0 = const()[name = tensor("op_792_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_792_end_0 = const()[name = tensor("op_792_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_792_end_mask_0 = const()[name = tensor("op_792_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_792_cast_fp16 = slice_by_index(begin = var_792_begin_0, end = var_792_end_0, end_mask = var_792_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_792_cast_fp16")]; + tensor var_796_begin_0 = const()[name = tensor("op_796_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_796_end_0 = const()[name = tensor("op_796_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_796_end_mask_0 = const()[name = tensor("op_796_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_796_cast_fp16 = slice_by_index(begin = var_796_begin_0, end = var_796_end_0, end_mask = var_796_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_796_cast_fp16")]; + tensor var_800_begin_0 = const()[name = tensor("op_800_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_800_end_0 = const()[name = tensor("op_800_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_800_end_mask_0 = const()[name = tensor("op_800_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_800_cast_fp16 = slice_by_index(begin = var_800_begin_0, end = var_800_end_0, end_mask = var_800_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_800_cast_fp16")]; + tensor var_804_begin_0 = const()[name = tensor("op_804_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_804_end_0 = const()[name = tensor("op_804_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_804_end_mask_0 = const()[name = tensor("op_804_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_804_cast_fp16 = slice_by_index(begin = var_804_begin_0, end = var_804_end_0, end_mask = var_804_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_804_cast_fp16")]; + tensor var_808_begin_0 = const()[name = tensor("op_808_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_808_end_0 = const()[name = tensor("op_808_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_808_end_mask_0 = const()[name = tensor("op_808_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_808_cast_fp16 = slice_by_index(begin = var_808_begin_0, end = var_808_end_0, end_mask = var_808_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_808_cast_fp16")]; + tensor k_15_perm_0 = const()[name = tensor("k_15_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_815_begin_0 = const()[name = tensor("op_815_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_815_end_0 = const()[name = tensor("op_815_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_815_end_mask_0 = const()[name = tensor("op_815_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_28 = transpose(perm = k_15_perm_0, x = k_13_cast_fp16)[name = tensor("transpose_28")]; + tensor var_815_cast_fp16 = slice_by_index(begin = var_815_begin_0, end = var_815_end_0, end_mask = var_815_end_mask_0, x = transpose_28)[name = tensor("op_815_cast_fp16")]; + tensor var_819_begin_0 = const()[name = tensor("op_819_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_819_end_0 = const()[name = tensor("op_819_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_819_end_mask_0 = const()[name = tensor("op_819_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_819_cast_fp16 = slice_by_index(begin = var_819_begin_0, end = var_819_end_0, end_mask = var_819_end_mask_0, x = transpose_28)[name = tensor("op_819_cast_fp16")]; + tensor var_823_begin_0 = const()[name = tensor("op_823_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_823_end_0 = const()[name = tensor("op_823_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_823_end_mask_0 = const()[name = tensor("op_823_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_823_cast_fp16 = slice_by_index(begin = var_823_begin_0, end = var_823_end_0, end_mask = var_823_end_mask_0, x = transpose_28)[name = tensor("op_823_cast_fp16")]; + tensor var_827_begin_0 = const()[name = tensor("op_827_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_827_end_0 = const()[name = tensor("op_827_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_827_end_mask_0 = const()[name = tensor("op_827_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_827_cast_fp16 = slice_by_index(begin = var_827_begin_0, end = var_827_end_0, end_mask = var_827_end_mask_0, x = transpose_28)[name = tensor("op_827_cast_fp16")]; + tensor var_831_begin_0 = const()[name = tensor("op_831_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_831_end_0 = const()[name = tensor("op_831_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_831_end_mask_0 = const()[name = tensor("op_831_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_831_cast_fp16 = slice_by_index(begin = var_831_begin_0, end = var_831_end_0, end_mask = var_831_end_mask_0, x = transpose_28)[name = tensor("op_831_cast_fp16")]; + tensor var_833_begin_0 = const()[name = tensor("op_833_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_833_end_0 = const()[name = tensor("op_833_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_833_end_mask_0 = const()[name = tensor("op_833_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_833_cast_fp16 = slice_by_index(begin = var_833_begin_0, end = var_833_end_0, end_mask = var_833_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_833_cast_fp16")]; + tensor var_837_begin_0 = const()[name = tensor("op_837_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_837_end_0 = const()[name = tensor("op_837_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_837_end_mask_0 = const()[name = tensor("op_837_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_837_cast_fp16 = slice_by_index(begin = var_837_begin_0, end = var_837_end_0, end_mask = var_837_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_837_cast_fp16")]; + tensor var_841_begin_0 = const()[name = tensor("op_841_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_841_end_0 = const()[name = tensor("op_841_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_841_end_mask_0 = const()[name = tensor("op_841_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_841_cast_fp16 = slice_by_index(begin = var_841_begin_0, end = var_841_end_0, end_mask = var_841_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_841_cast_fp16")]; + tensor var_845_begin_0 = const()[name = tensor("op_845_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_845_end_0 = const()[name = tensor("op_845_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_845_end_mask_0 = const()[name = tensor("op_845_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_845_cast_fp16 = slice_by_index(begin = var_845_begin_0, end = var_845_end_0, end_mask = var_845_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_845_cast_fp16")]; + tensor var_849_begin_0 = const()[name = tensor("op_849_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_849_end_0 = const()[name = tensor("op_849_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_849_end_mask_0 = const()[name = tensor("op_849_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_849_cast_fp16 = slice_by_index(begin = var_849_begin_0, end = var_849_end_0, end_mask = var_849_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_849_cast_fp16")]; + tensor var_853_equation_0 = const()[name = tensor("op_853_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_853_cast_fp16 = einsum(equation = var_853_equation_0, values = (var_815_cast_fp16, var_792_cast_fp16))[name = tensor("op_853_cast_fp16")]; + tensor var_854_to_fp16 = const()[name = tensor("op_854_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_31_cast_fp16 = mul(x = var_853_cast_fp16, y = var_854_to_fp16)[name = tensor("aw_31_cast_fp16")]; + tensor var_857_equation_0 = const()[name = tensor("op_857_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_857_cast_fp16 = einsum(equation = var_857_equation_0, values = (var_819_cast_fp16, var_796_cast_fp16))[name = tensor("op_857_cast_fp16")]; + tensor var_858_to_fp16 = const()[name = tensor("op_858_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_33_cast_fp16 = mul(x = var_857_cast_fp16, y = var_858_to_fp16)[name = tensor("aw_33_cast_fp16")]; + tensor var_861_equation_0 = const()[name = tensor("op_861_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_861_cast_fp16 = einsum(equation = var_861_equation_0, values = (var_823_cast_fp16, var_800_cast_fp16))[name = tensor("op_861_cast_fp16")]; + tensor var_862_to_fp16 = const()[name = tensor("op_862_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_35_cast_fp16 = mul(x = var_861_cast_fp16, y = var_862_to_fp16)[name = tensor("aw_35_cast_fp16")]; + tensor var_865_equation_0 = const()[name = tensor("op_865_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_865_cast_fp16 = einsum(equation = var_865_equation_0, values = (var_827_cast_fp16, var_804_cast_fp16))[name = tensor("op_865_cast_fp16")]; + tensor var_866_to_fp16 = const()[name = tensor("op_866_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_37_cast_fp16 = mul(x = var_865_cast_fp16, y = var_866_to_fp16)[name = tensor("aw_37_cast_fp16")]; + tensor var_869_equation_0 = const()[name = tensor("op_869_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_869_cast_fp16 = einsum(equation = var_869_equation_0, values = (var_831_cast_fp16, var_808_cast_fp16))[name = tensor("op_869_cast_fp16")]; + tensor var_870_to_fp16 = const()[name = tensor("op_870_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_39_cast_fp16 = mul(x = var_869_cast_fp16, y = var_870_to_fp16)[name = tensor("aw_39_cast_fp16")]; + tensor var_872_cast_fp16 = softmax(axis = var_112, x = aw_31_cast_fp16)[name = tensor("op_872_cast_fp16")]; + tensor var_873_cast_fp16 = softmax(axis = var_112, x = aw_33_cast_fp16)[name = tensor("op_873_cast_fp16")]; + tensor var_874_cast_fp16 = softmax(axis = var_112, x = aw_35_cast_fp16)[name = tensor("op_874_cast_fp16")]; + tensor var_875_cast_fp16 = softmax(axis = var_112, x = aw_37_cast_fp16)[name = tensor("op_875_cast_fp16")]; + tensor var_876_cast_fp16 = softmax(axis = var_112, x = aw_39_cast_fp16)[name = tensor("op_876_cast_fp16")]; + tensor var_878_equation_0 = const()[name = tensor("op_878_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_878_cast_fp16 = einsum(equation = var_878_equation_0, values = (var_833_cast_fp16, var_872_cast_fp16))[name = tensor("op_878_cast_fp16")]; + tensor var_880_equation_0 = const()[name = tensor("op_880_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_880_cast_fp16 = einsum(equation = var_880_equation_0, values = (var_837_cast_fp16, var_873_cast_fp16))[name = tensor("op_880_cast_fp16")]; + tensor var_882_equation_0 = const()[name = tensor("op_882_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_882_cast_fp16 = einsum(equation = var_882_equation_0, values = (var_841_cast_fp16, var_874_cast_fp16))[name = tensor("op_882_cast_fp16")]; + tensor var_884_equation_0 = const()[name = tensor("op_884_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_884_cast_fp16 = einsum(equation = var_884_equation_0, values = (var_845_cast_fp16, var_875_cast_fp16))[name = tensor("op_884_cast_fp16")]; + tensor var_886_equation_0 = const()[name = tensor("op_886_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_886_cast_fp16 = einsum(equation = var_886_equation_0, values = (var_849_cast_fp16, var_876_cast_fp16))[name = tensor("op_886_cast_fp16")]; + tensor input_53_interleave_0 = const()[name = tensor("input_53_interleave_0"), val = tensor(false)]; + tensor input_53_cast_fp16 = concat(axis = var_112, interleave = input_53_interleave_0, values = (var_878_cast_fp16, var_880_cast_fp16, var_882_cast_fp16, var_884_cast_fp16, var_886_cast_fp16))[name = tensor("input_53_cast_fp16")]; + tensor var_892 = const()[name = tensor("op_892"), val = tensor([1, 1])]; + tensor var_894 = const()[name = tensor("op_894"), val = tensor([1, 1])]; + tensor var_896_pad_type_0 = const()[name = tensor("op_896_pad_type_0"), val = tensor("custom")]; + tensor var_896_pad_0 = const()[name = tensor("op_896_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21115968)))]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21320832)))]; + tensor var_896_cast_fp16 = conv(bias = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_894, groups = var_112, pad = var_896_pad_0, pad_type = var_896_pad_type_0, strides = var_892, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_53_cast_fp16)[name = tensor("op_896_cast_fp16")]; + tensor inputs_11_cast_fp16 = add(x = var_896_cast_fp16, y = inputs_9_cast_fp16)[name = tensor("inputs_11_cast_fp16")]; + tensor var_900 = const()[name = tensor("op_900"), val = tensor([1])]; + tensor channels_mean_11_cast_fp16 = reduce_mean(axes = var_900, keep_dims = var_107, x = inputs_11_cast_fp16)[name = tensor("channels_mean_11_cast_fp16")]; + tensor zero_mean_11_cast_fp16 = sub(x = inputs_11_cast_fp16, y = channels_mean_11_cast_fp16)[name = tensor("zero_mean_11_cast_fp16")]; + tensor zero_mean_sq_11_cast_fp16 = mul(x = zero_mean_11_cast_fp16, y = zero_mean_11_cast_fp16)[name = tensor("zero_mean_sq_11_cast_fp16")]; + tensor var_904 = const()[name = tensor("op_904"), val = tensor([1])]; + tensor var_905_cast_fp16 = reduce_mean(axes = var_904, keep_dims = var_107, x = zero_mean_sq_11_cast_fp16)[name = tensor("op_905_cast_fp16")]; + tensor var_906_to_fp16 = const()[name = tensor("op_906_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_907_cast_fp16 = add(x = var_905_cast_fp16, y = var_906_to_fp16)[name = tensor("op_907_cast_fp16")]; + tensor denom_11_epsilon_0_to_fp16 = const()[name = tensor("denom_11_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_11_cast_fp16 = rsqrt(epsilon = denom_11_epsilon_0_to_fp16, x = var_907_cast_fp16)[name = tensor("denom_11_cast_fp16")]; + tensor out_11_cast_fp16 = mul(x = zero_mean_11_cast_fp16, y = denom_11_cast_fp16)[name = tensor("out_11_cast_fp16")]; + tensor var_911_to_fp16 = const()[name = tensor("op_911_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21321536)))]; + tensor var_912_cast_fp16 = add(x = out_11_cast_fp16, y = var_911_to_fp16)[name = tensor("op_912_cast_fp16")]; + tensor var_914_to_fp16 = const()[name = tensor("op_914_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21322240)))]; + tensor input_55_cast_fp16 = mul(x = var_912_cast_fp16, y = var_914_to_fp16)[name = tensor("input_55_cast_fp16")]; + tensor var_922 = const()[name = tensor("op_922"), val = tensor([1, 1])]; + tensor var_924 = const()[name = tensor("op_924"), val = tensor([1, 1])]; + tensor var_926_pad_type_0 = const()[name = tensor("op_926_pad_type_0"), val = tensor("custom")]; + tensor var_926_pad_0 = const()[name = tensor("op_926_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21322944)))]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22961408)))]; + tensor var_926_cast_fp16 = conv(bias = down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_924, groups = var_112, pad = var_926_pad_0, pad_type = var_926_pad_type_0, strides = var_922, weight = down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("op_926_cast_fp16")]; + tensor var_927_split_sizes_0 = const()[name = tensor("op_927_split_sizes_0"), val = tensor([1280, 1280])]; + tensor var_927_axis_0 = const()[name = tensor("op_927_axis_0"), val = tensor(1)]; + tensor var_927_cast_fp16_0, tensor var_927_cast_fp16_1 = split(axis = var_927_axis_0, split_sizes = var_927_split_sizes_0, x = var_926_cast_fp16)[name = tensor("op_927_cast_fp16")]; + tensor var_929_mode_0 = const()[name = tensor("op_929_mode_0"), val = tensor("EXACT")]; + tensor var_929_cast_fp16 = gelu(mode = var_929_mode_0, x = var_927_cast_fp16_1)[name = tensor("op_929_cast_fp16")]; + tensor input_57_cast_fp16 = mul(x = var_927_cast_fp16_0, y = var_929_cast_fp16)[name = tensor("input_57_cast_fp16")]; + tensor var_933 = const()[name = tensor("op_933"), val = tensor([1, 1])]; + tensor var_935 = const()[name = tensor("op_935"), val = tensor([1, 1])]; + tensor var_937_pad_type_0 = const()[name = tensor("op_937_pad_type_0"), val = tensor("custom")]; + tensor var_937_pad_0 = const()[name = tensor("op_937_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22966592)))]; + tensor down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23785856)))]; + tensor var_937_cast_fp16 = conv(bias = down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_935, groups = var_112, pad = var_937_pad_0, pad_type = var_937_pad_type_0, strides = var_933, weight = down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_57_cast_fp16)[name = tensor("op_937_cast_fp16")]; + tensor hidden_states_33_cast_fp16 = add(x = var_937_cast_fp16, y = inputs_11_cast_fp16)[name = tensor("hidden_states_33_cast_fp16")]; + tensor var_939 = const()[name = tensor("op_939"), val = tensor([2, 320, 48, 48])]; + tensor input_59_cast_fp16 = reshape(shape = var_939, x = hidden_states_33_cast_fp16)[name = tensor("input_59_cast_fp16")]; + tensor var_943 = const()[name = tensor("op_943"), val = tensor([1, 1])]; + tensor var_945 = const()[name = tensor("op_945"), val = tensor([1, 1])]; + tensor hidden_states_35_pad_type_0 = const()[name = tensor("hidden_states_35_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_35_pad_0 = const()[name = tensor("hidden_states_35_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_0_attentions_1_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23786560)))]; + tensor down_blocks_0_attentions_1_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23991424)))]; + tensor hidden_states_35_cast_fp16 = conv(bias = down_blocks_0_attentions_1_proj_out_bias_to_fp16, dilations = var_945, groups = var_112, pad = hidden_states_35_pad_0, pad_type = hidden_states_35_pad_type_0, strides = var_943, weight = down_blocks_0_attentions_1_proj_out_weight_to_fp16, x = input_59_cast_fp16)[name = tensor("hidden_states_35_cast_fp16")]; + tensor input_61_cast_fp16 = add(x = hidden_states_35_cast_fp16, y = hidden_states_23_cast_fp16)[name = tensor("input_61_cast_fp16")]; + tensor var_952 = const()[name = tensor("op_952"), val = tensor([2, 2])]; + tensor var_954 = const()[name = tensor("op_954"), val = tensor([1, 1])]; + tensor input_63_pad_type_0 = const()[name = tensor("input_63_pad_type_0"), val = tensor("custom")]; + tensor input_63_pad_0 = const()[name = tensor("input_63_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_0_downsamplers_0_conv_weight_to_fp16 = const()[name = tensor("down_blocks_0_downsamplers_0_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23992128)))]; + tensor down_blocks_0_downsamplers_0_conv_bias_to_fp16 = const()[name = tensor("down_blocks_0_downsamplers_0_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25835392)))]; + tensor input_63_cast_fp16 = conv(bias = down_blocks_0_downsamplers_0_conv_bias_to_fp16, dilations = var_954, groups = var_112, pad = input_63_pad_0, pad_type = input_63_pad_type_0, strides = var_952, weight = down_blocks_0_downsamplers_0_conv_weight_to_fp16, x = input_61_cast_fp16)[name = tensor("input_63_cast_fp16")]; + tensor var_979 = const()[name = tensor("op_979"), val = tensor(true)]; + tensor var_984 = const()[name = tensor("op_984"), val = tensor(1)]; + tensor reshape_24_shape_0 = const()[name = tensor("reshape_24_shape_0"), val = tensor([2, 32, 10, 24, 24])]; + tensor reshape_24_cast_fp16 = reshape(shape = reshape_24_shape_0, x = input_63_cast_fp16)[name = tensor("reshape_24_cast_fp16")]; + tensor reduce_mean_18_axes_0 = const()[name = tensor("reduce_mean_18_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_18_keep_dims_0 = const()[name = tensor("reduce_mean_18_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_18_cast_fp16 = reduce_mean(axes = reduce_mean_18_axes_0, keep_dims = reduce_mean_18_keep_dims_0, x = reshape_24_cast_fp16)[name = tensor("reduce_mean_18_cast_fp16")]; + tensor sub_12_cast_fp16 = sub(x = reshape_24_cast_fp16, y = reduce_mean_18_cast_fp16)[name = tensor("sub_12_cast_fp16")]; + tensor square_6_cast_fp16 = square(x = sub_12_cast_fp16)[name = tensor("square_6_cast_fp16")]; + tensor reduce_mean_20_axes_0 = const()[name = tensor("reduce_mean_20_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_20_keep_dims_0 = const()[name = tensor("reduce_mean_20_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_20_cast_fp16 = reduce_mean(axes = reduce_mean_20_axes_0, keep_dims = reduce_mean_20_keep_dims_0, x = square_6_cast_fp16)[name = tensor("reduce_mean_20_cast_fp16")]; + tensor add_12_y_0_to_fp16 = const()[name = tensor("add_12_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_12_cast_fp16 = add(x = reduce_mean_20_cast_fp16, y = add_12_y_0_to_fp16)[name = tensor("add_12_cast_fp16")]; + tensor sqrt_6_cast_fp16 = sqrt(x = add_12_cast_fp16)[name = tensor("sqrt_6_cast_fp16")]; + tensor real_div_6_cast_fp16 = real_div(x = sub_12_cast_fp16, y = sqrt_6_cast_fp16)[name = tensor("real_div_6_cast_fp16")]; + tensor reshape_25_shape_0 = const()[name = tensor("reshape_25_shape_0"), val = tensor([2, 320, 24, 24])]; + tensor reshape_25_cast_fp16 = reshape(shape = reshape_25_shape_0, x = real_div_6_cast_fp16)[name = tensor("reshape_25_cast_fp16")]; + tensor add_13_gamma_0_to_fp16 = const()[name = tensor("add_13_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25836096)))]; + tensor add_13_beta_0_to_fp16 = const()[name = tensor("add_13_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25836800)))]; + tensor add_13_epsilon_0_to_fp16 = const()[name = tensor("add_13_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_13_cast_fp16 = batch_norm(beta = add_13_beta_0_to_fp16, epsilon = add_13_epsilon_0_to_fp16, gamma = add_13_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_25_cast_fp16)[name = tensor("add_13_cast_fp16")]; + tensor input_67_cast_fp16 = silu(x = add_13_cast_fp16)[name = tensor("input_67_cast_fp16")]; + tensor var_1007 = const()[name = tensor("op_1007"), val = tensor([1, 1])]; + tensor var_1009 = const()[name = tensor("op_1009"), val = tensor([1, 1])]; + tensor hidden_states_37_pad_type_0 = const()[name = tensor("hidden_states_37_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_37_pad_0 = const()[name = tensor("hidden_states_37_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_1_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25837504)))]; + tensor down_blocks_1_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29523968)))]; + tensor hidden_states_37_cast_fp16 = conv(bias = down_blocks_1_resnets_0_conv1_bias_to_fp16, dilations = var_1009, groups = var_984, pad = hidden_states_37_pad_0, pad_type = hidden_states_37_pad_type_0, strides = var_1007, weight = down_blocks_1_resnets_0_conv1_weight_to_fp16, x = input_67_cast_fp16)[name = tensor("hidden_states_37_cast_fp16")]; + tensor var_1015 = const()[name = tensor("op_1015"), val = tensor([1, 1])]; + tensor var_1017 = const()[name = tensor("op_1017"), val = tensor([1, 1])]; + tensor temb_5_pad_type_0 = const()[name = tensor("temb_5_pad_type_0"), val = tensor("custom")]; + tensor temb_5_pad_0 = const()[name = tensor("temb_5_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29525312)))]; + tensor down_blocks_1_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31163776)))]; + tensor temb_5_cast_fp16 = conv(bias = down_blocks_1_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_1017, groups = var_984, pad = temb_5_pad_0, pad_type = temb_5_pad_type_0, strides = var_1015, weight = down_blocks_1_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_5_cast_fp16")]; + tensor input_71_cast_fp16 = add(x = hidden_states_37_cast_fp16, y = temb_5_cast_fp16)[name = tensor("input_71_cast_fp16")]; + tensor reshape_28_shape_0 = const()[name = tensor("reshape_28_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_28_cast_fp16 = reshape(shape = reshape_28_shape_0, x = input_71_cast_fp16)[name = tensor("reshape_28_cast_fp16")]; + tensor reduce_mean_21_axes_0 = const()[name = tensor("reduce_mean_21_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_21_keep_dims_0 = const()[name = tensor("reduce_mean_21_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_21_cast_fp16 = reduce_mean(axes = reduce_mean_21_axes_0, keep_dims = reduce_mean_21_keep_dims_0, x = reshape_28_cast_fp16)[name = tensor("reduce_mean_21_cast_fp16")]; + tensor sub_14_cast_fp16 = sub(x = reshape_28_cast_fp16, y = reduce_mean_21_cast_fp16)[name = tensor("sub_14_cast_fp16")]; + tensor square_7_cast_fp16 = square(x = sub_14_cast_fp16)[name = tensor("square_7_cast_fp16")]; + tensor reduce_mean_23_axes_0 = const()[name = tensor("reduce_mean_23_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_23_keep_dims_0 = const()[name = tensor("reduce_mean_23_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_23_cast_fp16 = reduce_mean(axes = reduce_mean_23_axes_0, keep_dims = reduce_mean_23_keep_dims_0, x = square_7_cast_fp16)[name = tensor("reduce_mean_23_cast_fp16")]; + tensor add_14_y_0_to_fp16 = const()[name = tensor("add_14_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_14_cast_fp16 = add(x = reduce_mean_23_cast_fp16, y = add_14_y_0_to_fp16)[name = tensor("add_14_cast_fp16")]; + tensor sqrt_7_cast_fp16 = sqrt(x = add_14_cast_fp16)[name = tensor("sqrt_7_cast_fp16")]; + tensor real_div_7_cast_fp16 = real_div(x = sub_14_cast_fp16, y = sqrt_7_cast_fp16)[name = tensor("real_div_7_cast_fp16")]; + tensor reshape_29_shape_0 = const()[name = tensor("reshape_29_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_29_cast_fp16 = reshape(shape = reshape_29_shape_0, x = real_div_7_cast_fp16)[name = tensor("reshape_29_cast_fp16")]; + tensor add_15_mean_0_to_fp16 = const()[name = tensor("add_15_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31165120)))]; + tensor add_15_variance_0_to_fp16 = const()[name = tensor("add_15_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31166464)))]; + tensor add_15_gamma_0_to_fp16 = const()[name = tensor("add_15_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31167808)))]; + tensor add_15_beta_0_to_fp16 = const()[name = tensor("add_15_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31169152)))]; + tensor add_15_epsilon_0_to_fp16 = const()[name = tensor("add_15_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_15_cast_fp16 = batch_norm(beta = add_15_beta_0_to_fp16, epsilon = add_15_epsilon_0_to_fp16, gamma = add_15_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_29_cast_fp16)[name = tensor("add_15_cast_fp16")]; + tensor input_75_cast_fp16 = silu(x = add_15_cast_fp16)[name = tensor("input_75_cast_fp16")]; + tensor var_1027 = const()[name = tensor("op_1027"), val = tensor([1, 1])]; + tensor var_1029 = const()[name = tensor("op_1029"), val = tensor([1, 1])]; + tensor hidden_states_39_pad_type_0 = const()[name = tensor("hidden_states_39_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_39_pad_0 = const()[name = tensor("hidden_states_39_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_1_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31170496)))]; + tensor down_blocks_1_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38543360)))]; + tensor hidden_states_39_cast_fp16 = conv(bias = down_blocks_1_resnets_0_conv2_bias_to_fp16, dilations = var_1029, groups = var_984, pad = hidden_states_39_pad_0, pad_type = hidden_states_39_pad_type_0, strides = var_1027, weight = down_blocks_1_resnets_0_conv2_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("hidden_states_39_cast_fp16")]; + tensor var_1034 = const()[name = tensor("op_1034"), val = tensor([1, 1])]; + tensor var_1036 = const()[name = tensor("op_1036"), val = tensor([1, 1])]; + tensor x_1_pad_type_0 = const()[name = tensor("x_1_pad_type_0"), val = tensor("custom")]; + tensor x_1_pad_0 = const()[name = tensor("x_1_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_resnets_0_conv_shortcut_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38544704)))]; + tensor down_blocks_1_resnets_0_conv_shortcut_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38954368)))]; + tensor x_1_cast_fp16 = conv(bias = down_blocks_1_resnets_0_conv_shortcut_bias_to_fp16, dilations = var_1036, groups = var_984, pad = x_1_pad_0, pad_type = x_1_pad_type_0, strides = var_1034, weight = down_blocks_1_resnets_0_conv_shortcut_weight_to_fp16, x = input_63_cast_fp16)[name = tensor("x_1_cast_fp16")]; + tensor hidden_states_41_cast_fp16 = add(x = x_1_cast_fp16, y = hidden_states_39_cast_fp16)[name = tensor("hidden_states_41_cast_fp16")]; + tensor reshape_32_shape_0 = const()[name = tensor("reshape_32_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_32_cast_fp16 = reshape(shape = reshape_32_shape_0, x = hidden_states_41_cast_fp16)[name = tensor("reshape_32_cast_fp16")]; + tensor reduce_mean_24_axes_0 = const()[name = tensor("reduce_mean_24_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_24_keep_dims_0 = const()[name = tensor("reduce_mean_24_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_24_cast_fp16 = reduce_mean(axes = reduce_mean_24_axes_0, keep_dims = reduce_mean_24_keep_dims_0, x = reshape_32_cast_fp16)[name = tensor("reduce_mean_24_cast_fp16")]; + tensor sub_16_cast_fp16 = sub(x = reshape_32_cast_fp16, y = reduce_mean_24_cast_fp16)[name = tensor("sub_16_cast_fp16")]; + tensor square_8_cast_fp16 = square(x = sub_16_cast_fp16)[name = tensor("square_8_cast_fp16")]; + tensor reduce_mean_26_axes_0 = const()[name = tensor("reduce_mean_26_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_26_keep_dims_0 = const()[name = tensor("reduce_mean_26_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_26_cast_fp16 = reduce_mean(axes = reduce_mean_26_axes_0, keep_dims = reduce_mean_26_keep_dims_0, x = square_8_cast_fp16)[name = tensor("reduce_mean_26_cast_fp16")]; + tensor add_16_y_0_to_fp16 = const()[name = tensor("add_16_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_16_cast_fp16 = add(x = reduce_mean_26_cast_fp16, y = add_16_y_0_to_fp16)[name = tensor("add_16_cast_fp16")]; + tensor sqrt_8_cast_fp16 = sqrt(x = add_16_cast_fp16)[name = tensor("sqrt_8_cast_fp16")]; + tensor real_div_8_cast_fp16 = real_div(x = sub_16_cast_fp16, y = sqrt_8_cast_fp16)[name = tensor("real_div_8_cast_fp16")]; + tensor reshape_33_shape_0 = const()[name = tensor("reshape_33_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_33_cast_fp16 = reshape(shape = reshape_33_shape_0, x = real_div_8_cast_fp16)[name = tensor("reshape_33_cast_fp16")]; + tensor add_17_gamma_0_to_fp16 = const()[name = tensor("add_17_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38955712)))]; + tensor add_17_beta_0_to_fp16 = const()[name = tensor("add_17_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38957056)))]; + tensor add_17_epsilon_0_to_fp16 = const()[name = tensor("add_17_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_17_cast_fp16 = batch_norm(beta = add_17_beta_0_to_fp16, epsilon = add_17_epsilon_0_to_fp16, gamma = add_17_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_33_cast_fp16)[name = tensor("add_17_cast_fp16")]; + tensor var_1056 = const()[name = tensor("op_1056"), val = tensor([1, 1])]; + tensor var_1058 = const()[name = tensor("op_1058"), val = tensor([1, 1])]; + tensor hidden_states_43_pad_type_0 = const()[name = tensor("hidden_states_43_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_43_pad_0 = const()[name = tensor("hidden_states_43_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38958400)))]; + tensor down_blocks_1_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39777664)))]; + tensor hidden_states_43_cast_fp16 = conv(bias = down_blocks_1_attentions_0_proj_in_bias_to_fp16, dilations = var_1058, groups = var_984, pad = hidden_states_43_pad_0, pad_type = hidden_states_43_pad_type_0, strides = var_1056, weight = down_blocks_1_attentions_0_proj_in_weight_to_fp16, x = add_17_cast_fp16)[name = tensor("hidden_states_43_cast_fp16")]; + tensor var_1063 = const()[name = tensor("op_1063"), val = tensor([2, 640, 1, 576])]; + tensor inputs_13_cast_fp16 = reshape(shape = var_1063, x = hidden_states_43_cast_fp16)[name = tensor("inputs_13_cast_fp16")]; + tensor var_1073 = const()[name = tensor("op_1073"), val = tensor([1])]; + tensor channels_mean_13_cast_fp16 = reduce_mean(axes = var_1073, keep_dims = var_979, x = inputs_13_cast_fp16)[name = tensor("channels_mean_13_cast_fp16")]; + tensor zero_mean_13_cast_fp16 = sub(x = inputs_13_cast_fp16, y = channels_mean_13_cast_fp16)[name = tensor("zero_mean_13_cast_fp16")]; + tensor zero_mean_sq_13_cast_fp16 = mul(x = zero_mean_13_cast_fp16, y = zero_mean_13_cast_fp16)[name = tensor("zero_mean_sq_13_cast_fp16")]; + tensor var_1077 = const()[name = tensor("op_1077"), val = tensor([1])]; + tensor var_1078_cast_fp16 = reduce_mean(axes = var_1077, keep_dims = var_979, x = zero_mean_sq_13_cast_fp16)[name = tensor("op_1078_cast_fp16")]; + tensor var_1079_to_fp16 = const()[name = tensor("op_1079_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1080_cast_fp16 = add(x = var_1078_cast_fp16, y = var_1079_to_fp16)[name = tensor("op_1080_cast_fp16")]; + tensor denom_13_epsilon_0_to_fp16 = const()[name = tensor("denom_13_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_13_cast_fp16 = rsqrt(epsilon = denom_13_epsilon_0_to_fp16, x = var_1080_cast_fp16)[name = tensor("denom_13_cast_fp16")]; + tensor out_13_cast_fp16 = mul(x = zero_mean_13_cast_fp16, y = denom_13_cast_fp16)[name = tensor("out_13_cast_fp16")]; + tensor var_1084_to_fp16 = const()[name = tensor("op_1084_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39779008)))]; + tensor var_1085_cast_fp16 = add(x = out_13_cast_fp16, y = var_1084_to_fp16)[name = tensor("op_1085_cast_fp16")]; + tensor var_1087_to_fp16 = const()[name = tensor("op_1087_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39780352)))]; + tensor hidden_states_45_cast_fp16 = mul(x = var_1085_cast_fp16, y = var_1087_to_fp16)[name = tensor("hidden_states_45_cast_fp16")]; + tensor var_1094 = const()[name = tensor("op_1094"), val = tensor([1, 1])]; + tensor var_1096 = const()[name = tensor("op_1096"), val = tensor([1, 1])]; + tensor q_9_pad_type_0 = const()[name = tensor("q_9_pad_type_0"), val = tensor("custom")]; + tensor q_9_pad_0 = const()[name = tensor("q_9_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39781696)))]; + tensor q_9_cast_fp16 = conv(dilations = var_1096, groups = var_984, pad = q_9_pad_0, pad_type = q_9_pad_type_0, strides = var_1094, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_45_cast_fp16)[name = tensor("q_9_cast_fp16")]; + tensor var_1100 = const()[name = tensor("op_1100"), val = tensor([1, 1])]; + tensor var_1102 = const()[name = tensor("op_1102"), val = tensor([1, 1])]; + tensor k_17_pad_type_0 = const()[name = tensor("k_17_pad_type_0"), val = tensor("custom")]; + tensor k_17_pad_0 = const()[name = tensor("k_17_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40600960)))]; + tensor k_17_cast_fp16 = conv(dilations = var_1102, groups = var_984, pad = k_17_pad_0, pad_type = k_17_pad_type_0, strides = var_1100, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_45_cast_fp16)[name = tensor("k_17_cast_fp16")]; + tensor var_1106 = const()[name = tensor("op_1106"), val = tensor([1, 1])]; + tensor var_1108 = const()[name = tensor("op_1108"), val = tensor([1, 1])]; + tensor v_9_pad_type_0 = const()[name = tensor("v_9_pad_type_0"), val = tensor("custom")]; + tensor v_9_pad_0 = const()[name = tensor("v_9_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41420224)))]; + tensor v_9_cast_fp16 = conv(dilations = var_1108, groups = var_984, pad = v_9_pad_0, pad_type = v_9_pad_type_0, strides = var_1106, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_45_cast_fp16)[name = tensor("v_9_cast_fp16")]; + tensor var_1112_begin_0 = const()[name = tensor("op_1112_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1112_end_0 = const()[name = tensor("op_1112_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_1112_end_mask_0 = const()[name = tensor("op_1112_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1112_cast_fp16 = slice_by_index(begin = var_1112_begin_0, end = var_1112_end_0, end_mask = var_1112_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1112_cast_fp16")]; + tensor var_1116_begin_0 = const()[name = tensor("op_1116_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_1116_end_0 = const()[name = tensor("op_1116_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_1116_end_mask_0 = const()[name = tensor("op_1116_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1116_cast_fp16 = slice_by_index(begin = var_1116_begin_0, end = var_1116_end_0, end_mask = var_1116_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1116_cast_fp16")]; + tensor var_1120_begin_0 = const()[name = tensor("op_1120_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_1120_end_0 = const()[name = tensor("op_1120_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_1120_end_mask_0 = const()[name = tensor("op_1120_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1120_cast_fp16 = slice_by_index(begin = var_1120_begin_0, end = var_1120_end_0, end_mask = var_1120_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1120_cast_fp16")]; + tensor var_1124_begin_0 = const()[name = tensor("op_1124_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_1124_end_0 = const()[name = tensor("op_1124_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_1124_end_mask_0 = const()[name = tensor("op_1124_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1124_cast_fp16 = slice_by_index(begin = var_1124_begin_0, end = var_1124_end_0, end_mask = var_1124_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1124_cast_fp16")]; + tensor var_1128_begin_0 = const()[name = tensor("op_1128_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_1128_end_0 = const()[name = tensor("op_1128_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_1128_end_mask_0 = const()[name = tensor("op_1128_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1128_cast_fp16 = slice_by_index(begin = var_1128_begin_0, end = var_1128_end_0, end_mask = var_1128_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1128_cast_fp16")]; + tensor var_1132_begin_0 = const()[name = tensor("op_1132_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_1132_end_0 = const()[name = tensor("op_1132_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_1132_end_mask_0 = const()[name = tensor("op_1132_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1132_cast_fp16 = slice_by_index(begin = var_1132_begin_0, end = var_1132_end_0, end_mask = var_1132_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1132_cast_fp16")]; + tensor var_1136_begin_0 = const()[name = tensor("op_1136_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_1136_end_0 = const()[name = tensor("op_1136_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_1136_end_mask_0 = const()[name = tensor("op_1136_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1136_cast_fp16 = slice_by_index(begin = var_1136_begin_0, end = var_1136_end_0, end_mask = var_1136_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1136_cast_fp16")]; + tensor var_1140_begin_0 = const()[name = tensor("op_1140_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_1140_end_0 = const()[name = tensor("op_1140_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_1140_end_mask_0 = const()[name = tensor("op_1140_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1140_cast_fp16 = slice_by_index(begin = var_1140_begin_0, end = var_1140_end_0, end_mask = var_1140_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1140_cast_fp16")]; + tensor var_1144_begin_0 = const()[name = tensor("op_1144_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_1144_end_0 = const()[name = tensor("op_1144_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_1144_end_mask_0 = const()[name = tensor("op_1144_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1144_cast_fp16 = slice_by_index(begin = var_1144_begin_0, end = var_1144_end_0, end_mask = var_1144_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1144_cast_fp16")]; + tensor var_1148_begin_0 = const()[name = tensor("op_1148_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_1148_end_0 = const()[name = tensor("op_1148_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_1148_end_mask_0 = const()[name = tensor("op_1148_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1148_cast_fp16 = slice_by_index(begin = var_1148_begin_0, end = var_1148_end_0, end_mask = var_1148_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1148_cast_fp16")]; + tensor k_19_perm_0 = const()[name = tensor("k_19_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_1155_begin_0 = const()[name = tensor("op_1155_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1155_end_0 = const()[name = tensor("op_1155_end_0"), val = tensor([2, 576, 1, 64])]; + tensor var_1155_end_mask_0 = const()[name = tensor("op_1155_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_27 = transpose(perm = k_19_perm_0, x = k_17_cast_fp16)[name = tensor("transpose_27")]; + tensor var_1155_cast_fp16 = slice_by_index(begin = var_1155_begin_0, end = var_1155_end_0, end_mask = var_1155_end_mask_0, x = transpose_27)[name = tensor("op_1155_cast_fp16")]; + tensor var_1159_begin_0 = const()[name = tensor("op_1159_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_1159_end_0 = const()[name = tensor("op_1159_end_0"), val = tensor([2, 576, 1, 128])]; + tensor var_1159_end_mask_0 = const()[name = tensor("op_1159_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1159_cast_fp16 = slice_by_index(begin = var_1159_begin_0, end = var_1159_end_0, end_mask = var_1159_end_mask_0, x = transpose_27)[name = tensor("op_1159_cast_fp16")]; + tensor var_1163_begin_0 = const()[name = tensor("op_1163_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_1163_end_0 = const()[name = tensor("op_1163_end_0"), val = tensor([2, 576, 1, 192])]; + tensor var_1163_end_mask_0 = const()[name = tensor("op_1163_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1163_cast_fp16 = slice_by_index(begin = var_1163_begin_0, end = var_1163_end_0, end_mask = var_1163_end_mask_0, x = transpose_27)[name = tensor("op_1163_cast_fp16")]; + tensor var_1167_begin_0 = const()[name = tensor("op_1167_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_1167_end_0 = const()[name = tensor("op_1167_end_0"), val = tensor([2, 576, 1, 256])]; + tensor var_1167_end_mask_0 = const()[name = tensor("op_1167_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1167_cast_fp16 = slice_by_index(begin = var_1167_begin_0, end = var_1167_end_0, end_mask = var_1167_end_mask_0, x = transpose_27)[name = tensor("op_1167_cast_fp16")]; + tensor var_1171_begin_0 = const()[name = tensor("op_1171_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_1171_end_0 = const()[name = tensor("op_1171_end_0"), val = tensor([2, 576, 1, 320])]; + tensor var_1171_end_mask_0 = const()[name = tensor("op_1171_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1171_cast_fp16 = slice_by_index(begin = var_1171_begin_0, end = var_1171_end_0, end_mask = var_1171_end_mask_0, x = transpose_27)[name = tensor("op_1171_cast_fp16")]; + tensor var_1175_begin_0 = const()[name = tensor("op_1175_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_1175_end_0 = const()[name = tensor("op_1175_end_0"), val = tensor([2, 576, 1, 384])]; + tensor var_1175_end_mask_0 = const()[name = tensor("op_1175_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1175_cast_fp16 = slice_by_index(begin = var_1175_begin_0, end = var_1175_end_0, end_mask = var_1175_end_mask_0, x = transpose_27)[name = tensor("op_1175_cast_fp16")]; + tensor var_1179_begin_0 = const()[name = tensor("op_1179_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_1179_end_0 = const()[name = tensor("op_1179_end_0"), val = tensor([2, 576, 1, 448])]; + tensor var_1179_end_mask_0 = const()[name = tensor("op_1179_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1179_cast_fp16 = slice_by_index(begin = var_1179_begin_0, end = var_1179_end_0, end_mask = var_1179_end_mask_0, x = transpose_27)[name = tensor("op_1179_cast_fp16")]; + tensor var_1183_begin_0 = const()[name = tensor("op_1183_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_1183_end_0 = const()[name = tensor("op_1183_end_0"), val = tensor([2, 576, 1, 512])]; + tensor var_1183_end_mask_0 = const()[name = tensor("op_1183_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1183_cast_fp16 = slice_by_index(begin = var_1183_begin_0, end = var_1183_end_0, end_mask = var_1183_end_mask_0, x = transpose_27)[name = tensor("op_1183_cast_fp16")]; + tensor var_1187_begin_0 = const()[name = tensor("op_1187_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_1187_end_0 = const()[name = tensor("op_1187_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_1187_end_mask_0 = const()[name = tensor("op_1187_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1187_cast_fp16 = slice_by_index(begin = var_1187_begin_0, end = var_1187_end_0, end_mask = var_1187_end_mask_0, x = transpose_27)[name = tensor("op_1187_cast_fp16")]; + tensor var_1191_begin_0 = const()[name = tensor("op_1191_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_1191_end_0 = const()[name = tensor("op_1191_end_0"), val = tensor([2, 576, 1, 640])]; + tensor var_1191_end_mask_0 = const()[name = tensor("op_1191_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1191_cast_fp16 = slice_by_index(begin = var_1191_begin_0, end = var_1191_end_0, end_mask = var_1191_end_mask_0, x = transpose_27)[name = tensor("op_1191_cast_fp16")]; + tensor var_1193_begin_0 = const()[name = tensor("op_1193_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1193_end_0 = const()[name = tensor("op_1193_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_1193_end_mask_0 = const()[name = tensor("op_1193_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1193_cast_fp16 = slice_by_index(begin = var_1193_begin_0, end = var_1193_end_0, end_mask = var_1193_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1193_cast_fp16")]; + tensor var_1197_begin_0 = const()[name = tensor("op_1197_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_1197_end_0 = const()[name = tensor("op_1197_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_1197_end_mask_0 = const()[name = tensor("op_1197_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1197_cast_fp16 = slice_by_index(begin = var_1197_begin_0, end = var_1197_end_0, end_mask = var_1197_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1197_cast_fp16")]; + tensor var_1201_begin_0 = const()[name = tensor("op_1201_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_1201_end_0 = const()[name = tensor("op_1201_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_1201_end_mask_0 = const()[name = tensor("op_1201_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1201_cast_fp16 = slice_by_index(begin = var_1201_begin_0, end = var_1201_end_0, end_mask = var_1201_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1201_cast_fp16")]; + tensor var_1205_begin_0 = const()[name = tensor("op_1205_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_1205_end_0 = const()[name = tensor("op_1205_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_1205_end_mask_0 = const()[name = tensor("op_1205_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1205_cast_fp16 = slice_by_index(begin = var_1205_begin_0, end = var_1205_end_0, end_mask = var_1205_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1205_cast_fp16")]; + tensor var_1209_begin_0 = const()[name = tensor("op_1209_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_1209_end_0 = const()[name = tensor("op_1209_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_1209_end_mask_0 = const()[name = tensor("op_1209_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1209_cast_fp16 = slice_by_index(begin = var_1209_begin_0, end = var_1209_end_0, end_mask = var_1209_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1209_cast_fp16")]; + tensor var_1213_begin_0 = const()[name = tensor("op_1213_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_1213_end_0 = const()[name = tensor("op_1213_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_1213_end_mask_0 = const()[name = tensor("op_1213_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1213_cast_fp16 = slice_by_index(begin = var_1213_begin_0, end = var_1213_end_0, end_mask = var_1213_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1213_cast_fp16")]; + tensor var_1217_begin_0 = const()[name = tensor("op_1217_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_1217_end_0 = const()[name = tensor("op_1217_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_1217_end_mask_0 = const()[name = tensor("op_1217_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1217_cast_fp16 = slice_by_index(begin = var_1217_begin_0, end = var_1217_end_0, end_mask = var_1217_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1217_cast_fp16")]; + tensor var_1221_begin_0 = const()[name = tensor("op_1221_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_1221_end_0 = const()[name = tensor("op_1221_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_1221_end_mask_0 = const()[name = tensor("op_1221_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1221_cast_fp16 = slice_by_index(begin = var_1221_begin_0, end = var_1221_end_0, end_mask = var_1221_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1221_cast_fp16")]; + tensor var_1225_begin_0 = const()[name = tensor("op_1225_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_1225_end_0 = const()[name = tensor("op_1225_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_1225_end_mask_0 = const()[name = tensor("op_1225_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1225_cast_fp16 = slice_by_index(begin = var_1225_begin_0, end = var_1225_end_0, end_mask = var_1225_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1225_cast_fp16")]; + tensor var_1229_begin_0 = const()[name = tensor("op_1229_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_1229_end_0 = const()[name = tensor("op_1229_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_1229_end_mask_0 = const()[name = tensor("op_1229_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1229_cast_fp16 = slice_by_index(begin = var_1229_begin_0, end = var_1229_end_0, end_mask = var_1229_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1229_cast_fp16")]; + tensor var_1233_equation_0 = const()[name = tensor("op_1233_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1233_cast_fp16 = einsum(equation = var_1233_equation_0, values = (var_1155_cast_fp16, var_1112_cast_fp16))[name = tensor("op_1233_cast_fp16")]; + tensor var_1234_to_fp16 = const()[name = tensor("op_1234_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_41_cast_fp16 = mul(x = var_1233_cast_fp16, y = var_1234_to_fp16)[name = tensor("aw_41_cast_fp16")]; + tensor var_1237_equation_0 = const()[name = tensor("op_1237_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1237_cast_fp16 = einsum(equation = var_1237_equation_0, values = (var_1159_cast_fp16, var_1116_cast_fp16))[name = tensor("op_1237_cast_fp16")]; + tensor var_1238_to_fp16 = const()[name = tensor("op_1238_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_43_cast_fp16 = mul(x = var_1237_cast_fp16, y = var_1238_to_fp16)[name = tensor("aw_43_cast_fp16")]; + tensor var_1241_equation_0 = const()[name = tensor("op_1241_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1241_cast_fp16 = einsum(equation = var_1241_equation_0, values = (var_1163_cast_fp16, var_1120_cast_fp16))[name = tensor("op_1241_cast_fp16")]; + tensor var_1242_to_fp16 = const()[name = tensor("op_1242_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_45_cast_fp16 = mul(x = var_1241_cast_fp16, y = var_1242_to_fp16)[name = tensor("aw_45_cast_fp16")]; + tensor var_1245_equation_0 = const()[name = tensor("op_1245_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1245_cast_fp16 = einsum(equation = var_1245_equation_0, values = (var_1167_cast_fp16, var_1124_cast_fp16))[name = tensor("op_1245_cast_fp16")]; + tensor var_1246_to_fp16 = const()[name = tensor("op_1246_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_47_cast_fp16 = mul(x = var_1245_cast_fp16, y = var_1246_to_fp16)[name = tensor("aw_47_cast_fp16")]; + tensor var_1249_equation_0 = const()[name = tensor("op_1249_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1249_cast_fp16 = einsum(equation = var_1249_equation_0, values = (var_1171_cast_fp16, var_1128_cast_fp16))[name = tensor("op_1249_cast_fp16")]; + tensor var_1250_to_fp16 = const()[name = tensor("op_1250_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_49_cast_fp16 = mul(x = var_1249_cast_fp16, y = var_1250_to_fp16)[name = tensor("aw_49_cast_fp16")]; + tensor var_1253_equation_0 = const()[name = tensor("op_1253_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1253_cast_fp16 = einsum(equation = var_1253_equation_0, values = (var_1175_cast_fp16, var_1132_cast_fp16))[name = tensor("op_1253_cast_fp16")]; + tensor var_1254_to_fp16 = const()[name = tensor("op_1254_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_51_cast_fp16 = mul(x = var_1253_cast_fp16, y = var_1254_to_fp16)[name = tensor("aw_51_cast_fp16")]; + tensor var_1257_equation_0 = const()[name = tensor("op_1257_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1257_cast_fp16 = einsum(equation = var_1257_equation_0, values = (var_1179_cast_fp16, var_1136_cast_fp16))[name = tensor("op_1257_cast_fp16")]; + tensor var_1258_to_fp16 = const()[name = tensor("op_1258_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_53_cast_fp16 = mul(x = var_1257_cast_fp16, y = var_1258_to_fp16)[name = tensor("aw_53_cast_fp16")]; + tensor var_1261_equation_0 = const()[name = tensor("op_1261_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1261_cast_fp16 = einsum(equation = var_1261_equation_0, values = (var_1183_cast_fp16, var_1140_cast_fp16))[name = tensor("op_1261_cast_fp16")]; + tensor var_1262_to_fp16 = const()[name = tensor("op_1262_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_55_cast_fp16 = mul(x = var_1261_cast_fp16, y = var_1262_to_fp16)[name = tensor("aw_55_cast_fp16")]; + tensor var_1265_equation_0 = const()[name = tensor("op_1265_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1265_cast_fp16 = einsum(equation = var_1265_equation_0, values = (var_1187_cast_fp16, var_1144_cast_fp16))[name = tensor("op_1265_cast_fp16")]; + tensor var_1266_to_fp16 = const()[name = tensor("op_1266_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_57_cast_fp16 = mul(x = var_1265_cast_fp16, y = var_1266_to_fp16)[name = tensor("aw_57_cast_fp16")]; + tensor var_1269_equation_0 = const()[name = tensor("op_1269_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1269_cast_fp16 = einsum(equation = var_1269_equation_0, values = (var_1191_cast_fp16, var_1148_cast_fp16))[name = tensor("op_1269_cast_fp16")]; + tensor var_1270_to_fp16 = const()[name = tensor("op_1270_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_59_cast_fp16 = mul(x = var_1269_cast_fp16, y = var_1270_to_fp16)[name = tensor("aw_59_cast_fp16")]; + tensor var_1272_cast_fp16 = softmax(axis = var_984, x = aw_41_cast_fp16)[name = tensor("op_1272_cast_fp16")]; + tensor var_1273_cast_fp16 = softmax(axis = var_984, x = aw_43_cast_fp16)[name = tensor("op_1273_cast_fp16")]; + tensor var_1274_cast_fp16 = softmax(axis = var_984, x = aw_45_cast_fp16)[name = tensor("op_1274_cast_fp16")]; + tensor var_1275_cast_fp16 = softmax(axis = var_984, x = aw_47_cast_fp16)[name = tensor("op_1275_cast_fp16")]; + tensor var_1276_cast_fp16 = softmax(axis = var_984, x = aw_49_cast_fp16)[name = tensor("op_1276_cast_fp16")]; + tensor var_1277_cast_fp16 = softmax(axis = var_984, x = aw_51_cast_fp16)[name = tensor("op_1277_cast_fp16")]; + tensor var_1278_cast_fp16 = softmax(axis = var_984, x = aw_53_cast_fp16)[name = tensor("op_1278_cast_fp16")]; + tensor var_1279_cast_fp16 = softmax(axis = var_984, x = aw_55_cast_fp16)[name = tensor("op_1279_cast_fp16")]; + tensor var_1280_cast_fp16 = softmax(axis = var_984, x = aw_57_cast_fp16)[name = tensor("op_1280_cast_fp16")]; + tensor var_1281_cast_fp16 = softmax(axis = var_984, x = aw_59_cast_fp16)[name = tensor("op_1281_cast_fp16")]; + tensor var_1283_equation_0 = const()[name = tensor("op_1283_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1283_cast_fp16 = einsum(equation = var_1283_equation_0, values = (var_1193_cast_fp16, var_1272_cast_fp16))[name = tensor("op_1283_cast_fp16")]; + tensor var_1285_equation_0 = const()[name = tensor("op_1285_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1285_cast_fp16 = einsum(equation = var_1285_equation_0, values = (var_1197_cast_fp16, var_1273_cast_fp16))[name = tensor("op_1285_cast_fp16")]; + tensor var_1287_equation_0 = const()[name = tensor("op_1287_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1287_cast_fp16 = einsum(equation = var_1287_equation_0, values = (var_1201_cast_fp16, var_1274_cast_fp16))[name = tensor("op_1287_cast_fp16")]; + tensor var_1289_equation_0 = const()[name = tensor("op_1289_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1289_cast_fp16 = einsum(equation = var_1289_equation_0, values = (var_1205_cast_fp16, var_1275_cast_fp16))[name = tensor("op_1289_cast_fp16")]; + tensor var_1291_equation_0 = const()[name = tensor("op_1291_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1291_cast_fp16 = einsum(equation = var_1291_equation_0, values = (var_1209_cast_fp16, var_1276_cast_fp16))[name = tensor("op_1291_cast_fp16")]; + tensor var_1293_equation_0 = const()[name = tensor("op_1293_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1293_cast_fp16 = einsum(equation = var_1293_equation_0, values = (var_1213_cast_fp16, var_1277_cast_fp16))[name = tensor("op_1293_cast_fp16")]; + tensor var_1295_equation_0 = const()[name = tensor("op_1295_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1295_cast_fp16 = einsum(equation = var_1295_equation_0, values = (var_1217_cast_fp16, var_1278_cast_fp16))[name = tensor("op_1295_cast_fp16")]; + tensor var_1297_equation_0 = const()[name = tensor("op_1297_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1297_cast_fp16 = einsum(equation = var_1297_equation_0, values = (var_1221_cast_fp16, var_1279_cast_fp16))[name = tensor("op_1297_cast_fp16")]; + tensor var_1299_equation_0 = const()[name = tensor("op_1299_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1299_cast_fp16 = einsum(equation = var_1299_equation_0, values = (var_1225_cast_fp16, var_1280_cast_fp16))[name = tensor("op_1299_cast_fp16")]; + tensor var_1301_equation_0 = const()[name = tensor("op_1301_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1301_cast_fp16 = einsum(equation = var_1301_equation_0, values = (var_1229_cast_fp16, var_1281_cast_fp16))[name = tensor("op_1301_cast_fp16")]; + tensor input_79_interleave_0 = const()[name = tensor("input_79_interleave_0"), val = tensor(false)]; + tensor input_79_cast_fp16 = concat(axis = var_984, interleave = input_79_interleave_0, values = (var_1283_cast_fp16, var_1285_cast_fp16, var_1287_cast_fp16, var_1289_cast_fp16, var_1291_cast_fp16, var_1293_cast_fp16, var_1295_cast_fp16, var_1297_cast_fp16, var_1299_cast_fp16, var_1301_cast_fp16))[name = tensor("input_79_cast_fp16")]; + tensor var_1307 = const()[name = tensor("op_1307"), val = tensor([1, 1])]; + tensor var_1309 = const()[name = tensor("op_1309"), val = tensor([1, 1])]; + tensor var_1311_pad_type_0 = const()[name = tensor("op_1311_pad_type_0"), val = tensor("custom")]; + tensor var_1311_pad_0 = const()[name = tensor("op_1311_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42239488)))]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43058752)))]; + tensor var_1311_cast_fp16 = conv(bias = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_1309, groups = var_984, pad = var_1311_pad_0, pad_type = var_1311_pad_type_0, strides = var_1307, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_79_cast_fp16)[name = tensor("op_1311_cast_fp16")]; + tensor inputs_15_cast_fp16 = add(x = var_1311_cast_fp16, y = inputs_13_cast_fp16)[name = tensor("inputs_15_cast_fp16")]; + tensor var_1315 = const()[name = tensor("op_1315"), val = tensor([1])]; + tensor channels_mean_15_cast_fp16 = reduce_mean(axes = var_1315, keep_dims = var_979, x = inputs_15_cast_fp16)[name = tensor("channels_mean_15_cast_fp16")]; + tensor zero_mean_15_cast_fp16 = sub(x = inputs_15_cast_fp16, y = channels_mean_15_cast_fp16)[name = tensor("zero_mean_15_cast_fp16")]; + tensor zero_mean_sq_15_cast_fp16 = mul(x = zero_mean_15_cast_fp16, y = zero_mean_15_cast_fp16)[name = tensor("zero_mean_sq_15_cast_fp16")]; + tensor var_1319 = const()[name = tensor("op_1319"), val = tensor([1])]; + tensor var_1320_cast_fp16 = reduce_mean(axes = var_1319, keep_dims = var_979, x = zero_mean_sq_15_cast_fp16)[name = tensor("op_1320_cast_fp16")]; + tensor var_1321_to_fp16 = const()[name = tensor("op_1321_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1322_cast_fp16 = add(x = var_1320_cast_fp16, y = var_1321_to_fp16)[name = tensor("op_1322_cast_fp16")]; + tensor denom_15_epsilon_0_to_fp16 = const()[name = tensor("denom_15_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_15_cast_fp16 = rsqrt(epsilon = denom_15_epsilon_0_to_fp16, x = var_1322_cast_fp16)[name = tensor("denom_15_cast_fp16")]; + tensor out_15_cast_fp16 = mul(x = zero_mean_15_cast_fp16, y = denom_15_cast_fp16)[name = tensor("out_15_cast_fp16")]; + tensor var_1326_to_fp16 = const()[name = tensor("op_1326_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43060096)))]; + tensor var_1327_cast_fp16 = add(x = out_15_cast_fp16, y = var_1326_to_fp16)[name = tensor("op_1327_cast_fp16")]; + tensor var_1329_to_fp16 = const()[name = tensor("op_1329_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43061440)))]; + tensor hidden_states_47_cast_fp16 = mul(x = var_1327_cast_fp16, y = var_1329_to_fp16)[name = tensor("hidden_states_47_cast_fp16")]; + tensor var_1336 = const()[name = tensor("op_1336"), val = tensor([1, 1])]; + tensor var_1338 = const()[name = tensor("op_1338"), val = tensor([1, 1])]; + tensor q_11_pad_type_0 = const()[name = tensor("q_11_pad_type_0"), val = tensor("custom")]; + tensor q_11_pad_0 = const()[name = tensor("q_11_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43062784)))]; + tensor q_11_cast_fp16 = conv(dilations = var_1338, groups = var_984, pad = q_11_pad_0, pad_type = q_11_pad_type_0, strides = var_1336, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_47_cast_fp16)[name = tensor("q_11_cast_fp16")]; + tensor var_1342 = const()[name = tensor("op_1342"), val = tensor([1, 1])]; + tensor var_1344 = const()[name = tensor("op_1344"), val = tensor([1, 1])]; + tensor k_21_pad_type_0 = const()[name = tensor("k_21_pad_type_0"), val = tensor("custom")]; + tensor k_21_pad_0 = const()[name = tensor("k_21_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43882048)))]; + tensor k_21_cast_fp16 = conv(dilations = var_1344, groups = var_984, pad = k_21_pad_0, pad_type = k_21_pad_type_0, strides = var_1342, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_21_cast_fp16")]; + tensor var_1348 = const()[name = tensor("op_1348"), val = tensor([1, 1])]; + tensor var_1350 = const()[name = tensor("op_1350"), val = tensor([1, 1])]; + tensor v_11_pad_type_0 = const()[name = tensor("v_11_pad_type_0"), val = tensor("custom")]; + tensor v_11_pad_0 = const()[name = tensor("v_11_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45192832)))]; + tensor v_11_cast_fp16 = conv(dilations = var_1350, groups = var_984, pad = v_11_pad_0, pad_type = v_11_pad_type_0, strides = var_1348, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_11_cast_fp16")]; + tensor var_1354_begin_0 = const()[name = tensor("op_1354_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1354_end_0 = const()[name = tensor("op_1354_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_1354_end_mask_0 = const()[name = tensor("op_1354_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1354_cast_fp16 = slice_by_index(begin = var_1354_begin_0, end = var_1354_end_0, end_mask = var_1354_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1354_cast_fp16")]; + tensor var_1358_begin_0 = const()[name = tensor("op_1358_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_1358_end_0 = const()[name = tensor("op_1358_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_1358_end_mask_0 = const()[name = tensor("op_1358_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1358_cast_fp16 = slice_by_index(begin = var_1358_begin_0, end = var_1358_end_0, end_mask = var_1358_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1358_cast_fp16")]; + tensor var_1362_begin_0 = const()[name = tensor("op_1362_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_1362_end_0 = const()[name = tensor("op_1362_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_1362_end_mask_0 = const()[name = tensor("op_1362_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1362_cast_fp16 = slice_by_index(begin = var_1362_begin_0, end = var_1362_end_0, end_mask = var_1362_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1362_cast_fp16")]; + tensor var_1366_begin_0 = const()[name = tensor("op_1366_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_1366_end_0 = const()[name = tensor("op_1366_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_1366_end_mask_0 = const()[name = tensor("op_1366_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1366_cast_fp16 = slice_by_index(begin = var_1366_begin_0, end = var_1366_end_0, end_mask = var_1366_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1366_cast_fp16")]; + tensor var_1370_begin_0 = const()[name = tensor("op_1370_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_1370_end_0 = const()[name = tensor("op_1370_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_1370_end_mask_0 = const()[name = tensor("op_1370_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1370_cast_fp16 = slice_by_index(begin = var_1370_begin_0, end = var_1370_end_0, end_mask = var_1370_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1370_cast_fp16")]; + tensor var_1374_begin_0 = const()[name = tensor("op_1374_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_1374_end_0 = const()[name = tensor("op_1374_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_1374_end_mask_0 = const()[name = tensor("op_1374_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1374_cast_fp16 = slice_by_index(begin = var_1374_begin_0, end = var_1374_end_0, end_mask = var_1374_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1374_cast_fp16")]; + tensor var_1378_begin_0 = const()[name = tensor("op_1378_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_1378_end_0 = const()[name = tensor("op_1378_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_1378_end_mask_0 = const()[name = tensor("op_1378_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1378_cast_fp16 = slice_by_index(begin = var_1378_begin_0, end = var_1378_end_0, end_mask = var_1378_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1378_cast_fp16")]; + tensor var_1382_begin_0 = const()[name = tensor("op_1382_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_1382_end_0 = const()[name = tensor("op_1382_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_1382_end_mask_0 = const()[name = tensor("op_1382_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1382_cast_fp16 = slice_by_index(begin = var_1382_begin_0, end = var_1382_end_0, end_mask = var_1382_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1382_cast_fp16")]; + tensor var_1386_begin_0 = const()[name = tensor("op_1386_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_1386_end_0 = const()[name = tensor("op_1386_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_1386_end_mask_0 = const()[name = tensor("op_1386_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1386_cast_fp16 = slice_by_index(begin = var_1386_begin_0, end = var_1386_end_0, end_mask = var_1386_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1386_cast_fp16")]; + tensor var_1390_begin_0 = const()[name = tensor("op_1390_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_1390_end_0 = const()[name = tensor("op_1390_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_1390_end_mask_0 = const()[name = tensor("op_1390_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1390_cast_fp16 = slice_by_index(begin = var_1390_begin_0, end = var_1390_end_0, end_mask = var_1390_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1390_cast_fp16")]; + tensor k_23_perm_0 = const()[name = tensor("k_23_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_1397_begin_0 = const()[name = tensor("op_1397_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1397_end_0 = const()[name = tensor("op_1397_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_1397_end_mask_0 = const()[name = tensor("op_1397_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_26 = transpose(perm = k_23_perm_0, x = k_21_cast_fp16)[name = tensor("transpose_26")]; + tensor var_1397_cast_fp16 = slice_by_index(begin = var_1397_begin_0, end = var_1397_end_0, end_mask = var_1397_end_mask_0, x = transpose_26)[name = tensor("op_1397_cast_fp16")]; + tensor var_1401_begin_0 = const()[name = tensor("op_1401_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_1401_end_0 = const()[name = tensor("op_1401_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_1401_end_mask_0 = const()[name = tensor("op_1401_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1401_cast_fp16 = slice_by_index(begin = var_1401_begin_0, end = var_1401_end_0, end_mask = var_1401_end_mask_0, x = transpose_26)[name = tensor("op_1401_cast_fp16")]; + tensor var_1405_begin_0 = const()[name = tensor("op_1405_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_1405_end_0 = const()[name = tensor("op_1405_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_1405_end_mask_0 = const()[name = tensor("op_1405_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1405_cast_fp16 = slice_by_index(begin = var_1405_begin_0, end = var_1405_end_0, end_mask = var_1405_end_mask_0, x = transpose_26)[name = tensor("op_1405_cast_fp16")]; + tensor var_1409_begin_0 = const()[name = tensor("op_1409_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_1409_end_0 = const()[name = tensor("op_1409_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_1409_end_mask_0 = const()[name = tensor("op_1409_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1409_cast_fp16 = slice_by_index(begin = var_1409_begin_0, end = var_1409_end_0, end_mask = var_1409_end_mask_0, x = transpose_26)[name = tensor("op_1409_cast_fp16")]; + tensor var_1413_begin_0 = const()[name = tensor("op_1413_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_1413_end_0 = const()[name = tensor("op_1413_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_1413_end_mask_0 = const()[name = tensor("op_1413_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1413_cast_fp16 = slice_by_index(begin = var_1413_begin_0, end = var_1413_end_0, end_mask = var_1413_end_mask_0, x = transpose_26)[name = tensor("op_1413_cast_fp16")]; + tensor var_1417_begin_0 = const()[name = tensor("op_1417_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_1417_end_0 = const()[name = tensor("op_1417_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_1417_end_mask_0 = const()[name = tensor("op_1417_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1417_cast_fp16 = slice_by_index(begin = var_1417_begin_0, end = var_1417_end_0, end_mask = var_1417_end_mask_0, x = transpose_26)[name = tensor("op_1417_cast_fp16")]; + tensor var_1421_begin_0 = const()[name = tensor("op_1421_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_1421_end_0 = const()[name = tensor("op_1421_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_1421_end_mask_0 = const()[name = tensor("op_1421_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1421_cast_fp16 = slice_by_index(begin = var_1421_begin_0, end = var_1421_end_0, end_mask = var_1421_end_mask_0, x = transpose_26)[name = tensor("op_1421_cast_fp16")]; + tensor var_1425_begin_0 = const()[name = tensor("op_1425_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_1425_end_0 = const()[name = tensor("op_1425_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_1425_end_mask_0 = const()[name = tensor("op_1425_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1425_cast_fp16 = slice_by_index(begin = var_1425_begin_0, end = var_1425_end_0, end_mask = var_1425_end_mask_0, x = transpose_26)[name = tensor("op_1425_cast_fp16")]; + tensor var_1429_begin_0 = const()[name = tensor("op_1429_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_1429_end_0 = const()[name = tensor("op_1429_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_1429_end_mask_0 = const()[name = tensor("op_1429_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1429_cast_fp16 = slice_by_index(begin = var_1429_begin_0, end = var_1429_end_0, end_mask = var_1429_end_mask_0, x = transpose_26)[name = tensor("op_1429_cast_fp16")]; + tensor var_1433_begin_0 = const()[name = tensor("op_1433_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_1433_end_0 = const()[name = tensor("op_1433_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_1433_end_mask_0 = const()[name = tensor("op_1433_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1433_cast_fp16 = slice_by_index(begin = var_1433_begin_0, end = var_1433_end_0, end_mask = var_1433_end_mask_0, x = transpose_26)[name = tensor("op_1433_cast_fp16")]; + tensor var_1435_begin_0 = const()[name = tensor("op_1435_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1435_end_0 = const()[name = tensor("op_1435_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_1435_end_mask_0 = const()[name = tensor("op_1435_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1435_cast_fp16 = slice_by_index(begin = var_1435_begin_0, end = var_1435_end_0, end_mask = var_1435_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1435_cast_fp16")]; + tensor var_1439_begin_0 = const()[name = tensor("op_1439_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_1439_end_0 = const()[name = tensor("op_1439_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_1439_end_mask_0 = const()[name = tensor("op_1439_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1439_cast_fp16 = slice_by_index(begin = var_1439_begin_0, end = var_1439_end_0, end_mask = var_1439_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1439_cast_fp16")]; + tensor var_1443_begin_0 = const()[name = tensor("op_1443_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_1443_end_0 = const()[name = tensor("op_1443_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_1443_end_mask_0 = const()[name = tensor("op_1443_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1443_cast_fp16 = slice_by_index(begin = var_1443_begin_0, end = var_1443_end_0, end_mask = var_1443_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1443_cast_fp16")]; + tensor var_1447_begin_0 = const()[name = tensor("op_1447_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_1447_end_0 = const()[name = tensor("op_1447_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_1447_end_mask_0 = const()[name = tensor("op_1447_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1447_cast_fp16 = slice_by_index(begin = var_1447_begin_0, end = var_1447_end_0, end_mask = var_1447_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1447_cast_fp16")]; + tensor var_1451_begin_0 = const()[name = tensor("op_1451_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_1451_end_0 = const()[name = tensor("op_1451_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_1451_end_mask_0 = const()[name = tensor("op_1451_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1451_cast_fp16 = slice_by_index(begin = var_1451_begin_0, end = var_1451_end_0, end_mask = var_1451_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1451_cast_fp16")]; + tensor var_1455_begin_0 = const()[name = tensor("op_1455_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_1455_end_0 = const()[name = tensor("op_1455_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_1455_end_mask_0 = const()[name = tensor("op_1455_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1455_cast_fp16 = slice_by_index(begin = var_1455_begin_0, end = var_1455_end_0, end_mask = var_1455_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1455_cast_fp16")]; + tensor var_1459_begin_0 = const()[name = tensor("op_1459_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_1459_end_0 = const()[name = tensor("op_1459_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_1459_end_mask_0 = const()[name = tensor("op_1459_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1459_cast_fp16 = slice_by_index(begin = var_1459_begin_0, end = var_1459_end_0, end_mask = var_1459_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1459_cast_fp16")]; + tensor var_1463_begin_0 = const()[name = tensor("op_1463_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_1463_end_0 = const()[name = tensor("op_1463_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_1463_end_mask_0 = const()[name = tensor("op_1463_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1463_cast_fp16 = slice_by_index(begin = var_1463_begin_0, end = var_1463_end_0, end_mask = var_1463_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1463_cast_fp16")]; + tensor var_1467_begin_0 = const()[name = tensor("op_1467_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_1467_end_0 = const()[name = tensor("op_1467_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_1467_end_mask_0 = const()[name = tensor("op_1467_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1467_cast_fp16 = slice_by_index(begin = var_1467_begin_0, end = var_1467_end_0, end_mask = var_1467_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1467_cast_fp16")]; + tensor var_1471_begin_0 = const()[name = tensor("op_1471_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_1471_end_0 = const()[name = tensor("op_1471_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_1471_end_mask_0 = const()[name = tensor("op_1471_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1471_cast_fp16 = slice_by_index(begin = var_1471_begin_0, end = var_1471_end_0, end_mask = var_1471_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1471_cast_fp16")]; + tensor var_1475_equation_0 = const()[name = tensor("op_1475_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1475_cast_fp16 = einsum(equation = var_1475_equation_0, values = (var_1397_cast_fp16, var_1354_cast_fp16))[name = tensor("op_1475_cast_fp16")]; + tensor var_1476_to_fp16 = const()[name = tensor("op_1476_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_61_cast_fp16 = mul(x = var_1475_cast_fp16, y = var_1476_to_fp16)[name = tensor("aw_61_cast_fp16")]; + tensor var_1479_equation_0 = const()[name = tensor("op_1479_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1479_cast_fp16 = einsum(equation = var_1479_equation_0, values = (var_1401_cast_fp16, var_1358_cast_fp16))[name = tensor("op_1479_cast_fp16")]; + tensor var_1480_to_fp16 = const()[name = tensor("op_1480_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_63_cast_fp16 = mul(x = var_1479_cast_fp16, y = var_1480_to_fp16)[name = tensor("aw_63_cast_fp16")]; + tensor var_1483_equation_0 = const()[name = tensor("op_1483_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1483_cast_fp16 = einsum(equation = var_1483_equation_0, values = (var_1405_cast_fp16, var_1362_cast_fp16))[name = tensor("op_1483_cast_fp16")]; + tensor var_1484_to_fp16 = const()[name = tensor("op_1484_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_65_cast_fp16 = mul(x = var_1483_cast_fp16, y = var_1484_to_fp16)[name = tensor("aw_65_cast_fp16")]; + tensor var_1487_equation_0 = const()[name = tensor("op_1487_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1487_cast_fp16 = einsum(equation = var_1487_equation_0, values = (var_1409_cast_fp16, var_1366_cast_fp16))[name = tensor("op_1487_cast_fp16")]; + tensor var_1488_to_fp16 = const()[name = tensor("op_1488_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_67_cast_fp16 = mul(x = var_1487_cast_fp16, y = var_1488_to_fp16)[name = tensor("aw_67_cast_fp16")]; + tensor var_1491_equation_0 = const()[name = tensor("op_1491_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1491_cast_fp16 = einsum(equation = var_1491_equation_0, values = (var_1413_cast_fp16, var_1370_cast_fp16))[name = tensor("op_1491_cast_fp16")]; + tensor var_1492_to_fp16 = const()[name = tensor("op_1492_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_69_cast_fp16 = mul(x = var_1491_cast_fp16, y = var_1492_to_fp16)[name = tensor("aw_69_cast_fp16")]; + tensor var_1495_equation_0 = const()[name = tensor("op_1495_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1495_cast_fp16 = einsum(equation = var_1495_equation_0, values = (var_1417_cast_fp16, var_1374_cast_fp16))[name = tensor("op_1495_cast_fp16")]; + tensor var_1496_to_fp16 = const()[name = tensor("op_1496_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_71_cast_fp16 = mul(x = var_1495_cast_fp16, y = var_1496_to_fp16)[name = tensor("aw_71_cast_fp16")]; + tensor var_1499_equation_0 = const()[name = tensor("op_1499_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1499_cast_fp16 = einsum(equation = var_1499_equation_0, values = (var_1421_cast_fp16, var_1378_cast_fp16))[name = tensor("op_1499_cast_fp16")]; + tensor var_1500_to_fp16 = const()[name = tensor("op_1500_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_73_cast_fp16 = mul(x = var_1499_cast_fp16, y = var_1500_to_fp16)[name = tensor("aw_73_cast_fp16")]; + tensor var_1503_equation_0 = const()[name = tensor("op_1503_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1503_cast_fp16 = einsum(equation = var_1503_equation_0, values = (var_1425_cast_fp16, var_1382_cast_fp16))[name = tensor("op_1503_cast_fp16")]; + tensor var_1504_to_fp16 = const()[name = tensor("op_1504_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_75_cast_fp16 = mul(x = var_1503_cast_fp16, y = var_1504_to_fp16)[name = tensor("aw_75_cast_fp16")]; + tensor var_1507_equation_0 = const()[name = tensor("op_1507_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1507_cast_fp16 = einsum(equation = var_1507_equation_0, values = (var_1429_cast_fp16, var_1386_cast_fp16))[name = tensor("op_1507_cast_fp16")]; + tensor var_1508_to_fp16 = const()[name = tensor("op_1508_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_77_cast_fp16 = mul(x = var_1507_cast_fp16, y = var_1508_to_fp16)[name = tensor("aw_77_cast_fp16")]; + tensor var_1511_equation_0 = const()[name = tensor("op_1511_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1511_cast_fp16 = einsum(equation = var_1511_equation_0, values = (var_1433_cast_fp16, var_1390_cast_fp16))[name = tensor("op_1511_cast_fp16")]; + tensor var_1512_to_fp16 = const()[name = tensor("op_1512_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_79_cast_fp16 = mul(x = var_1511_cast_fp16, y = var_1512_to_fp16)[name = tensor("aw_79_cast_fp16")]; + tensor var_1514_cast_fp16 = softmax(axis = var_984, x = aw_61_cast_fp16)[name = tensor("op_1514_cast_fp16")]; + tensor var_1515_cast_fp16 = softmax(axis = var_984, x = aw_63_cast_fp16)[name = tensor("op_1515_cast_fp16")]; + tensor var_1516_cast_fp16 = softmax(axis = var_984, x = aw_65_cast_fp16)[name = tensor("op_1516_cast_fp16")]; + tensor var_1517_cast_fp16 = softmax(axis = var_984, x = aw_67_cast_fp16)[name = tensor("op_1517_cast_fp16")]; + tensor var_1518_cast_fp16 = softmax(axis = var_984, x = aw_69_cast_fp16)[name = tensor("op_1518_cast_fp16")]; + tensor var_1519_cast_fp16 = softmax(axis = var_984, x = aw_71_cast_fp16)[name = tensor("op_1519_cast_fp16")]; + tensor var_1520_cast_fp16 = softmax(axis = var_984, x = aw_73_cast_fp16)[name = tensor("op_1520_cast_fp16")]; + tensor var_1521_cast_fp16 = softmax(axis = var_984, x = aw_75_cast_fp16)[name = tensor("op_1521_cast_fp16")]; + tensor var_1522_cast_fp16 = softmax(axis = var_984, x = aw_77_cast_fp16)[name = tensor("op_1522_cast_fp16")]; + tensor var_1523_cast_fp16 = softmax(axis = var_984, x = aw_79_cast_fp16)[name = tensor("op_1523_cast_fp16")]; + tensor var_1525_equation_0 = const()[name = tensor("op_1525_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1525_cast_fp16 = einsum(equation = var_1525_equation_0, values = (var_1435_cast_fp16, var_1514_cast_fp16))[name = tensor("op_1525_cast_fp16")]; + tensor var_1527_equation_0 = const()[name = tensor("op_1527_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1527_cast_fp16 = einsum(equation = var_1527_equation_0, values = (var_1439_cast_fp16, var_1515_cast_fp16))[name = tensor("op_1527_cast_fp16")]; + tensor var_1529_equation_0 = const()[name = tensor("op_1529_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1529_cast_fp16 = einsum(equation = var_1529_equation_0, values = (var_1443_cast_fp16, var_1516_cast_fp16))[name = tensor("op_1529_cast_fp16")]; + tensor var_1531_equation_0 = const()[name = tensor("op_1531_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1531_cast_fp16 = einsum(equation = var_1531_equation_0, values = (var_1447_cast_fp16, var_1517_cast_fp16))[name = tensor("op_1531_cast_fp16")]; + tensor var_1533_equation_0 = const()[name = tensor("op_1533_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1533_cast_fp16 = einsum(equation = var_1533_equation_0, values = (var_1451_cast_fp16, var_1518_cast_fp16))[name = tensor("op_1533_cast_fp16")]; + tensor var_1535_equation_0 = const()[name = tensor("op_1535_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1535_cast_fp16 = einsum(equation = var_1535_equation_0, values = (var_1455_cast_fp16, var_1519_cast_fp16))[name = tensor("op_1535_cast_fp16")]; + tensor var_1537_equation_0 = const()[name = tensor("op_1537_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1537_cast_fp16 = einsum(equation = var_1537_equation_0, values = (var_1459_cast_fp16, var_1520_cast_fp16))[name = tensor("op_1537_cast_fp16")]; + tensor var_1539_equation_0 = const()[name = tensor("op_1539_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1539_cast_fp16 = einsum(equation = var_1539_equation_0, values = (var_1463_cast_fp16, var_1521_cast_fp16))[name = tensor("op_1539_cast_fp16")]; + tensor var_1541_equation_0 = const()[name = tensor("op_1541_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1541_cast_fp16 = einsum(equation = var_1541_equation_0, values = (var_1467_cast_fp16, var_1522_cast_fp16))[name = tensor("op_1541_cast_fp16")]; + tensor var_1543_equation_0 = const()[name = tensor("op_1543_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1543_cast_fp16 = einsum(equation = var_1543_equation_0, values = (var_1471_cast_fp16, var_1523_cast_fp16))[name = tensor("op_1543_cast_fp16")]; + tensor input_81_interleave_0 = const()[name = tensor("input_81_interleave_0"), val = tensor(false)]; + tensor input_81_cast_fp16 = concat(axis = var_984, interleave = input_81_interleave_0, values = (var_1525_cast_fp16, var_1527_cast_fp16, var_1529_cast_fp16, var_1531_cast_fp16, var_1533_cast_fp16, var_1535_cast_fp16, var_1537_cast_fp16, var_1539_cast_fp16, var_1541_cast_fp16, var_1543_cast_fp16))[name = tensor("input_81_cast_fp16")]; + tensor var_1549 = const()[name = tensor("op_1549"), val = tensor([1, 1])]; + tensor var_1551 = const()[name = tensor("op_1551"), val = tensor([1, 1])]; + tensor var_1553_pad_type_0 = const()[name = tensor("op_1553_pad_type_0"), val = tensor("custom")]; + tensor var_1553_pad_0 = const()[name = tensor("op_1553_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46503616)))]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47322880)))]; + tensor var_1553_cast_fp16 = conv(bias = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_1551, groups = var_984, pad = var_1553_pad_0, pad_type = var_1553_pad_type_0, strides = var_1549, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_81_cast_fp16)[name = tensor("op_1553_cast_fp16")]; + tensor inputs_17_cast_fp16 = add(x = var_1553_cast_fp16, y = inputs_15_cast_fp16)[name = tensor("inputs_17_cast_fp16")]; + tensor var_1557 = const()[name = tensor("op_1557"), val = tensor([1])]; + tensor channels_mean_17_cast_fp16 = reduce_mean(axes = var_1557, keep_dims = var_979, x = inputs_17_cast_fp16)[name = tensor("channels_mean_17_cast_fp16")]; + tensor zero_mean_17_cast_fp16 = sub(x = inputs_17_cast_fp16, y = channels_mean_17_cast_fp16)[name = tensor("zero_mean_17_cast_fp16")]; + tensor zero_mean_sq_17_cast_fp16 = mul(x = zero_mean_17_cast_fp16, y = zero_mean_17_cast_fp16)[name = tensor("zero_mean_sq_17_cast_fp16")]; + tensor var_1561 = const()[name = tensor("op_1561"), val = tensor([1])]; + tensor var_1562_cast_fp16 = reduce_mean(axes = var_1561, keep_dims = var_979, x = zero_mean_sq_17_cast_fp16)[name = tensor("op_1562_cast_fp16")]; + tensor var_1563_to_fp16 = const()[name = tensor("op_1563_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1564_cast_fp16 = add(x = var_1562_cast_fp16, y = var_1563_to_fp16)[name = tensor("op_1564_cast_fp16")]; + tensor denom_17_epsilon_0_to_fp16 = const()[name = tensor("denom_17_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_17_cast_fp16 = rsqrt(epsilon = denom_17_epsilon_0_to_fp16, x = var_1564_cast_fp16)[name = tensor("denom_17_cast_fp16")]; + tensor out_17_cast_fp16 = mul(x = zero_mean_17_cast_fp16, y = denom_17_cast_fp16)[name = tensor("out_17_cast_fp16")]; + tensor var_1568_to_fp16 = const()[name = tensor("op_1568_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47324224)))]; + tensor var_1569_cast_fp16 = add(x = out_17_cast_fp16, y = var_1568_to_fp16)[name = tensor("op_1569_cast_fp16")]; + tensor var_1571_to_fp16 = const()[name = tensor("op_1571_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47325568)))]; + tensor input_83_cast_fp16 = mul(x = var_1569_cast_fp16, y = var_1571_to_fp16)[name = tensor("input_83_cast_fp16")]; + tensor var_1579 = const()[name = tensor("op_1579"), val = tensor([1, 1])]; + tensor var_1581 = const()[name = tensor("op_1581"), val = tensor([1, 1])]; + tensor var_1583_pad_type_0 = const()[name = tensor("op_1583_pad_type_0"), val = tensor("custom")]; + tensor var_1583_pad_0 = const()[name = tensor("op_1583_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47326912)))]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53880576)))]; + tensor var_1583_cast_fp16 = conv(bias = down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_1581, groups = var_984, pad = var_1583_pad_0, pad_type = var_1583_pad_type_0, strides = var_1579, weight = down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_83_cast_fp16)[name = tensor("op_1583_cast_fp16")]; + tensor var_1584_split_sizes_0 = const()[name = tensor("op_1584_split_sizes_0"), val = tensor([2560, 2560])]; + tensor var_1584_axis_0 = const()[name = tensor("op_1584_axis_0"), val = tensor(1)]; + tensor var_1584_cast_fp16_0, tensor var_1584_cast_fp16_1 = split(axis = var_1584_axis_0, split_sizes = var_1584_split_sizes_0, x = var_1583_cast_fp16)[name = tensor("op_1584_cast_fp16")]; + tensor var_1586_mode_0 = const()[name = tensor("op_1586_mode_0"), val = tensor("EXACT")]; + tensor var_1586_cast_fp16 = gelu(mode = var_1586_mode_0, x = var_1584_cast_fp16_1)[name = tensor("op_1586_cast_fp16")]; + tensor input_85_cast_fp16 = mul(x = var_1584_cast_fp16_0, y = var_1586_cast_fp16)[name = tensor("input_85_cast_fp16")]; + tensor var_1590 = const()[name = tensor("op_1590"), val = tensor([1, 1])]; + tensor var_1592 = const()[name = tensor("op_1592"), val = tensor([1, 1])]; + tensor var_1594_pad_type_0 = const()[name = tensor("op_1594_pad_type_0"), val = tensor("custom")]; + tensor var_1594_pad_0 = const()[name = tensor("op_1594_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53890880)))]; + tensor down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57167744)))]; + tensor var_1594_cast_fp16 = conv(bias = down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_1592, groups = var_984, pad = var_1594_pad_0, pad_type = var_1594_pad_type_0, strides = var_1590, weight = down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_85_cast_fp16)[name = tensor("op_1594_cast_fp16")]; + tensor hidden_states_51_cast_fp16 = add(x = var_1594_cast_fp16, y = inputs_17_cast_fp16)[name = tensor("hidden_states_51_cast_fp16")]; + tensor var_1596 = const()[name = tensor("op_1596"), val = tensor([2, 640, 24, 24])]; + tensor input_87_cast_fp16 = reshape(shape = var_1596, x = hidden_states_51_cast_fp16)[name = tensor("input_87_cast_fp16")]; + tensor var_1600 = const()[name = tensor("op_1600"), val = tensor([1, 1])]; + tensor var_1602 = const()[name = tensor("op_1602"), val = tensor([1, 1])]; + tensor hidden_states_53_pad_type_0 = const()[name = tensor("hidden_states_53_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_53_pad_0 = const()[name = tensor("hidden_states_53_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57169088)))]; + tensor down_blocks_1_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57988352)))]; + tensor hidden_states_53_cast_fp16 = conv(bias = down_blocks_1_attentions_0_proj_out_bias_to_fp16, dilations = var_1602, groups = var_984, pad = hidden_states_53_pad_0, pad_type = hidden_states_53_pad_type_0, strides = var_1600, weight = down_blocks_1_attentions_0_proj_out_weight_to_fp16, x = input_87_cast_fp16)[name = tensor("hidden_states_53_cast_fp16")]; + tensor input_89_cast_fp16 = add(x = hidden_states_53_cast_fp16, y = hidden_states_41_cast_fp16)[name = tensor("input_89_cast_fp16")]; + tensor reshape_36_shape_0 = const()[name = tensor("reshape_36_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_36_cast_fp16 = reshape(shape = reshape_36_shape_0, x = input_89_cast_fp16)[name = tensor("reshape_36_cast_fp16")]; + tensor reduce_mean_27_axes_0 = const()[name = tensor("reduce_mean_27_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_27_keep_dims_0 = const()[name = tensor("reduce_mean_27_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_27_cast_fp16 = reduce_mean(axes = reduce_mean_27_axes_0, keep_dims = reduce_mean_27_keep_dims_0, x = reshape_36_cast_fp16)[name = tensor("reduce_mean_27_cast_fp16")]; + tensor sub_18_cast_fp16 = sub(x = reshape_36_cast_fp16, y = reduce_mean_27_cast_fp16)[name = tensor("sub_18_cast_fp16")]; + tensor square_9_cast_fp16 = square(x = sub_18_cast_fp16)[name = tensor("square_9_cast_fp16")]; + tensor reduce_mean_29_axes_0 = const()[name = tensor("reduce_mean_29_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_29_keep_dims_0 = const()[name = tensor("reduce_mean_29_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_29_cast_fp16 = reduce_mean(axes = reduce_mean_29_axes_0, keep_dims = reduce_mean_29_keep_dims_0, x = square_9_cast_fp16)[name = tensor("reduce_mean_29_cast_fp16")]; + tensor add_18_y_0_to_fp16 = const()[name = tensor("add_18_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_18_cast_fp16 = add(x = reduce_mean_29_cast_fp16, y = add_18_y_0_to_fp16)[name = tensor("add_18_cast_fp16")]; + tensor sqrt_9_cast_fp16 = sqrt(x = add_18_cast_fp16)[name = tensor("sqrt_9_cast_fp16")]; + tensor real_div_9_cast_fp16 = real_div(x = sub_18_cast_fp16, y = sqrt_9_cast_fp16)[name = tensor("real_div_9_cast_fp16")]; + tensor reshape_37_shape_0 = const()[name = tensor("reshape_37_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_37_cast_fp16 = reshape(shape = reshape_37_shape_0, x = real_div_9_cast_fp16)[name = tensor("reshape_37_cast_fp16")]; + tensor add_19_gamma_0_to_fp16 = const()[name = tensor("add_19_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57989696)))]; + tensor add_19_beta_0_to_fp16 = const()[name = tensor("add_19_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57991040)))]; + tensor add_19_epsilon_0_to_fp16 = const()[name = tensor("add_19_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_19_cast_fp16 = batch_norm(beta = add_19_beta_0_to_fp16, epsilon = add_19_epsilon_0_to_fp16, gamma = add_19_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_37_cast_fp16)[name = tensor("add_19_cast_fp16")]; + tensor input_93_cast_fp16 = silu(x = add_19_cast_fp16)[name = tensor("input_93_cast_fp16")]; + tensor var_1617 = const()[name = tensor("op_1617"), val = tensor([1, 1])]; + tensor var_1619 = const()[name = tensor("op_1619"), val = tensor([1, 1])]; + tensor hidden_states_55_pad_type_0 = const()[name = tensor("hidden_states_55_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_55_pad_0 = const()[name = tensor("hidden_states_55_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_1_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57992384)))]; + tensor down_blocks_1_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65365248)))]; + tensor hidden_states_55_cast_fp16 = conv(bias = down_blocks_1_resnets_1_conv1_bias_to_fp16, dilations = var_1619, groups = var_984, pad = hidden_states_55_pad_0, pad_type = hidden_states_55_pad_type_0, strides = var_1617, weight = down_blocks_1_resnets_1_conv1_weight_to_fp16, x = input_93_cast_fp16)[name = tensor("hidden_states_55_cast_fp16")]; + tensor var_1625 = const()[name = tensor("op_1625"), val = tensor([1, 1])]; + tensor var_1627 = const()[name = tensor("op_1627"), val = tensor([1, 1])]; + tensor temb_7_pad_type_0 = const()[name = tensor("temb_7_pad_type_0"), val = tensor("custom")]; + tensor temb_7_pad_0 = const()[name = tensor("temb_7_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65366592)))]; + tensor down_blocks_1_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67005056)))]; + tensor temb_7_cast_fp16 = conv(bias = down_blocks_1_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_1627, groups = var_984, pad = temb_7_pad_0, pad_type = temb_7_pad_type_0, strides = var_1625, weight = down_blocks_1_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_7_cast_fp16")]; + tensor input_97_cast_fp16 = add(x = hidden_states_55_cast_fp16, y = temb_7_cast_fp16)[name = tensor("input_97_cast_fp16")]; + tensor reshape_40_shape_0 = const()[name = tensor("reshape_40_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_40_cast_fp16 = reshape(shape = reshape_40_shape_0, x = input_97_cast_fp16)[name = tensor("reshape_40_cast_fp16")]; + tensor reduce_mean_30_axes_0 = const()[name = tensor("reduce_mean_30_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_30_keep_dims_0 = const()[name = tensor("reduce_mean_30_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_30_cast_fp16 = reduce_mean(axes = reduce_mean_30_axes_0, keep_dims = reduce_mean_30_keep_dims_0, x = reshape_40_cast_fp16)[name = tensor("reduce_mean_30_cast_fp16")]; + tensor sub_20_cast_fp16 = sub(x = reshape_40_cast_fp16, y = reduce_mean_30_cast_fp16)[name = tensor("sub_20_cast_fp16")]; + tensor square_10_cast_fp16 = square(x = sub_20_cast_fp16)[name = tensor("square_10_cast_fp16")]; + tensor reduce_mean_32_axes_0 = const()[name = tensor("reduce_mean_32_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_32_keep_dims_0 = const()[name = tensor("reduce_mean_32_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_32_cast_fp16 = reduce_mean(axes = reduce_mean_32_axes_0, keep_dims = reduce_mean_32_keep_dims_0, x = square_10_cast_fp16)[name = tensor("reduce_mean_32_cast_fp16")]; + tensor add_20_y_0_to_fp16 = const()[name = tensor("add_20_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_20_cast_fp16 = add(x = reduce_mean_32_cast_fp16, y = add_20_y_0_to_fp16)[name = tensor("add_20_cast_fp16")]; + tensor sqrt_10_cast_fp16 = sqrt(x = add_20_cast_fp16)[name = tensor("sqrt_10_cast_fp16")]; + tensor real_div_10_cast_fp16 = real_div(x = sub_20_cast_fp16, y = sqrt_10_cast_fp16)[name = tensor("real_div_10_cast_fp16")]; + tensor reshape_41_shape_0 = const()[name = tensor("reshape_41_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_41_cast_fp16 = reshape(shape = reshape_41_shape_0, x = real_div_10_cast_fp16)[name = tensor("reshape_41_cast_fp16")]; + tensor add_21_gamma_0_to_fp16 = const()[name = tensor("add_21_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67006400)))]; + tensor add_21_beta_0_to_fp16 = const()[name = tensor("add_21_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67007744)))]; + tensor add_21_epsilon_0_to_fp16 = const()[name = tensor("add_21_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_21_cast_fp16 = batch_norm(beta = add_21_beta_0_to_fp16, epsilon = add_21_epsilon_0_to_fp16, gamma = add_21_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_41_cast_fp16)[name = tensor("add_21_cast_fp16")]; + tensor input_101_cast_fp16 = silu(x = add_21_cast_fp16)[name = tensor("input_101_cast_fp16")]; + tensor var_1637 = const()[name = tensor("op_1637"), val = tensor([1, 1])]; + tensor var_1639 = const()[name = tensor("op_1639"), val = tensor([1, 1])]; + tensor hidden_states_57_pad_type_0 = const()[name = tensor("hidden_states_57_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_57_pad_0 = const()[name = tensor("hidden_states_57_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_1_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67009088)))]; + tensor down_blocks_1_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74381952)))]; + tensor hidden_states_57_cast_fp16 = conv(bias = down_blocks_1_resnets_1_conv2_bias_to_fp16, dilations = var_1639, groups = var_984, pad = hidden_states_57_pad_0, pad_type = hidden_states_57_pad_type_0, strides = var_1637, weight = down_blocks_1_resnets_1_conv2_weight_to_fp16, x = input_101_cast_fp16)[name = tensor("hidden_states_57_cast_fp16")]; + tensor hidden_states_59_cast_fp16 = add(x = input_89_cast_fp16, y = hidden_states_57_cast_fp16)[name = tensor("hidden_states_59_cast_fp16")]; + tensor reshape_44_shape_0 = const()[name = tensor("reshape_44_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_44_cast_fp16 = reshape(shape = reshape_44_shape_0, x = hidden_states_59_cast_fp16)[name = tensor("reshape_44_cast_fp16")]; + tensor reduce_mean_33_axes_0 = const()[name = tensor("reduce_mean_33_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_33_keep_dims_0 = const()[name = tensor("reduce_mean_33_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_33_cast_fp16 = reduce_mean(axes = reduce_mean_33_axes_0, keep_dims = reduce_mean_33_keep_dims_0, x = reshape_44_cast_fp16)[name = tensor("reduce_mean_33_cast_fp16")]; + tensor sub_22_cast_fp16 = sub(x = reshape_44_cast_fp16, y = reduce_mean_33_cast_fp16)[name = tensor("sub_22_cast_fp16")]; + tensor square_11_cast_fp16 = square(x = sub_22_cast_fp16)[name = tensor("square_11_cast_fp16")]; + tensor reduce_mean_35_axes_0 = const()[name = tensor("reduce_mean_35_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_35_keep_dims_0 = const()[name = tensor("reduce_mean_35_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_35_cast_fp16 = reduce_mean(axes = reduce_mean_35_axes_0, keep_dims = reduce_mean_35_keep_dims_0, x = square_11_cast_fp16)[name = tensor("reduce_mean_35_cast_fp16")]; + tensor add_22_y_0_to_fp16 = const()[name = tensor("add_22_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_22_cast_fp16 = add(x = reduce_mean_35_cast_fp16, y = add_22_y_0_to_fp16)[name = tensor("add_22_cast_fp16")]; + tensor sqrt_11_cast_fp16 = sqrt(x = add_22_cast_fp16)[name = tensor("sqrt_11_cast_fp16")]; + tensor real_div_11_cast_fp16 = real_div(x = sub_22_cast_fp16, y = sqrt_11_cast_fp16)[name = tensor("real_div_11_cast_fp16")]; + tensor reshape_45_shape_0 = const()[name = tensor("reshape_45_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_45_cast_fp16 = reshape(shape = reshape_45_shape_0, x = real_div_11_cast_fp16)[name = tensor("reshape_45_cast_fp16")]; + tensor add_23_gamma_0_to_fp16 = const()[name = tensor("add_23_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74383296)))]; + tensor add_23_beta_0_to_fp16 = const()[name = tensor("add_23_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74384640)))]; + tensor add_23_epsilon_0_to_fp16 = const()[name = tensor("add_23_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_23_cast_fp16 = batch_norm(beta = add_23_beta_0_to_fp16, epsilon = add_23_epsilon_0_to_fp16, gamma = add_23_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_45_cast_fp16)[name = tensor("add_23_cast_fp16")]; + tensor var_1659 = const()[name = tensor("op_1659"), val = tensor([1, 1])]; + tensor var_1661 = const()[name = tensor("op_1661"), val = tensor([1, 1])]; + tensor hidden_states_61_pad_type_0 = const()[name = tensor("hidden_states_61_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_61_pad_0 = const()[name = tensor("hidden_states_61_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74385984)))]; + tensor down_blocks_1_attentions_1_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75205248)))]; + tensor hidden_states_61_cast_fp16 = conv(bias = down_blocks_1_attentions_1_proj_in_bias_to_fp16, dilations = var_1661, groups = var_984, pad = hidden_states_61_pad_0, pad_type = hidden_states_61_pad_type_0, strides = var_1659, weight = down_blocks_1_attentions_1_proj_in_weight_to_fp16, x = add_23_cast_fp16)[name = tensor("hidden_states_61_cast_fp16")]; + tensor var_1666 = const()[name = tensor("op_1666"), val = tensor([2, 640, 1, 576])]; + tensor inputs_19_cast_fp16 = reshape(shape = var_1666, x = hidden_states_61_cast_fp16)[name = tensor("inputs_19_cast_fp16")]; + tensor var_1676 = const()[name = tensor("op_1676"), val = tensor([1])]; + tensor channels_mean_19_cast_fp16 = reduce_mean(axes = var_1676, keep_dims = var_979, x = inputs_19_cast_fp16)[name = tensor("channels_mean_19_cast_fp16")]; + tensor zero_mean_19_cast_fp16 = sub(x = inputs_19_cast_fp16, y = channels_mean_19_cast_fp16)[name = tensor("zero_mean_19_cast_fp16")]; + tensor zero_mean_sq_19_cast_fp16 = mul(x = zero_mean_19_cast_fp16, y = zero_mean_19_cast_fp16)[name = tensor("zero_mean_sq_19_cast_fp16")]; + tensor var_1680 = const()[name = tensor("op_1680"), val = tensor([1])]; + tensor var_1681_cast_fp16 = reduce_mean(axes = var_1680, keep_dims = var_979, x = zero_mean_sq_19_cast_fp16)[name = tensor("op_1681_cast_fp16")]; + tensor var_1682_to_fp16 = const()[name = tensor("op_1682_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1683_cast_fp16 = add(x = var_1681_cast_fp16, y = var_1682_to_fp16)[name = tensor("op_1683_cast_fp16")]; + tensor denom_19_epsilon_0_to_fp16 = const()[name = tensor("denom_19_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_19_cast_fp16 = rsqrt(epsilon = denom_19_epsilon_0_to_fp16, x = var_1683_cast_fp16)[name = tensor("denom_19_cast_fp16")]; + tensor out_19_cast_fp16 = mul(x = zero_mean_19_cast_fp16, y = denom_19_cast_fp16)[name = tensor("out_19_cast_fp16")]; + tensor var_1687_to_fp16 = const()[name = tensor("op_1687_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75206592)))]; + tensor var_1688_cast_fp16 = add(x = out_19_cast_fp16, y = var_1687_to_fp16)[name = tensor("op_1688_cast_fp16")]; + tensor var_1690_to_fp16 = const()[name = tensor("op_1690_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75207936)))]; + tensor hidden_states_63_cast_fp16 = mul(x = var_1688_cast_fp16, y = var_1690_to_fp16)[name = tensor("hidden_states_63_cast_fp16")]; + tensor var_1697 = const()[name = tensor("op_1697"), val = tensor([1, 1])]; + tensor var_1699 = const()[name = tensor("op_1699"), val = tensor([1, 1])]; + tensor q_13_pad_type_0 = const()[name = tensor("q_13_pad_type_0"), val = tensor("custom")]; + tensor q_13_pad_0 = const()[name = tensor("q_13_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75209280)))]; + tensor q_13_cast_fp16 = conv(dilations = var_1699, groups = var_984, pad = q_13_pad_0, pad_type = q_13_pad_type_0, strides = var_1697, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_63_cast_fp16)[name = tensor("q_13_cast_fp16")]; + tensor var_1703 = const()[name = tensor("op_1703"), val = tensor([1, 1])]; + tensor var_1705 = const()[name = tensor("op_1705"), val = tensor([1, 1])]; + tensor k_25_pad_type_0 = const()[name = tensor("k_25_pad_type_0"), val = tensor("custom")]; + tensor k_25_pad_0 = const()[name = tensor("k_25_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76028544)))]; + tensor k_25_cast_fp16 = conv(dilations = var_1705, groups = var_984, pad = k_25_pad_0, pad_type = k_25_pad_type_0, strides = var_1703, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_63_cast_fp16)[name = tensor("k_25_cast_fp16")]; + tensor var_1709 = const()[name = tensor("op_1709"), val = tensor([1, 1])]; + tensor var_1711 = const()[name = tensor("op_1711"), val = tensor([1, 1])]; + tensor v_13_pad_type_0 = const()[name = tensor("v_13_pad_type_0"), val = tensor("custom")]; + tensor v_13_pad_0 = const()[name = tensor("v_13_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76847808)))]; + tensor v_13_cast_fp16 = conv(dilations = var_1711, groups = var_984, pad = v_13_pad_0, pad_type = v_13_pad_type_0, strides = var_1709, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_63_cast_fp16)[name = tensor("v_13_cast_fp16")]; + tensor var_1715_begin_0 = const()[name = tensor("op_1715_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1715_end_0 = const()[name = tensor("op_1715_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_1715_end_mask_0 = const()[name = tensor("op_1715_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1715_cast_fp16 = slice_by_index(begin = var_1715_begin_0, end = var_1715_end_0, end_mask = var_1715_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1715_cast_fp16")]; + tensor var_1719_begin_0 = const()[name = tensor("op_1719_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_1719_end_0 = const()[name = tensor("op_1719_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_1719_end_mask_0 = const()[name = tensor("op_1719_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1719_cast_fp16 = slice_by_index(begin = var_1719_begin_0, end = var_1719_end_0, end_mask = var_1719_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1719_cast_fp16")]; + tensor var_1723_begin_0 = const()[name = tensor("op_1723_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_1723_end_0 = const()[name = tensor("op_1723_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_1723_end_mask_0 = const()[name = tensor("op_1723_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1723_cast_fp16 = slice_by_index(begin = var_1723_begin_0, end = var_1723_end_0, end_mask = var_1723_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1723_cast_fp16")]; + tensor var_1727_begin_0 = const()[name = tensor("op_1727_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_1727_end_0 = const()[name = tensor("op_1727_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_1727_end_mask_0 = const()[name = tensor("op_1727_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1727_cast_fp16 = slice_by_index(begin = var_1727_begin_0, end = var_1727_end_0, end_mask = var_1727_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1727_cast_fp16")]; + tensor var_1731_begin_0 = const()[name = tensor("op_1731_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_1731_end_0 = const()[name = tensor("op_1731_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_1731_end_mask_0 = const()[name = tensor("op_1731_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1731_cast_fp16 = slice_by_index(begin = var_1731_begin_0, end = var_1731_end_0, end_mask = var_1731_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1731_cast_fp16")]; + tensor var_1735_begin_0 = const()[name = tensor("op_1735_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_1735_end_0 = const()[name = tensor("op_1735_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_1735_end_mask_0 = const()[name = tensor("op_1735_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1735_cast_fp16 = slice_by_index(begin = var_1735_begin_0, end = var_1735_end_0, end_mask = var_1735_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1735_cast_fp16")]; + tensor var_1739_begin_0 = const()[name = tensor("op_1739_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_1739_end_0 = const()[name = tensor("op_1739_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_1739_end_mask_0 = const()[name = tensor("op_1739_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1739_cast_fp16 = slice_by_index(begin = var_1739_begin_0, end = var_1739_end_0, end_mask = var_1739_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1739_cast_fp16")]; + tensor var_1743_begin_0 = const()[name = tensor("op_1743_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_1743_end_0 = const()[name = tensor("op_1743_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_1743_end_mask_0 = const()[name = tensor("op_1743_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1743_cast_fp16 = slice_by_index(begin = var_1743_begin_0, end = var_1743_end_0, end_mask = var_1743_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1743_cast_fp16")]; + tensor var_1747_begin_0 = const()[name = tensor("op_1747_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_1747_end_0 = const()[name = tensor("op_1747_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_1747_end_mask_0 = const()[name = tensor("op_1747_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1747_cast_fp16 = slice_by_index(begin = var_1747_begin_0, end = var_1747_end_0, end_mask = var_1747_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1747_cast_fp16")]; + tensor var_1751_begin_0 = const()[name = tensor("op_1751_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_1751_end_0 = const()[name = tensor("op_1751_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_1751_end_mask_0 = const()[name = tensor("op_1751_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1751_cast_fp16 = slice_by_index(begin = var_1751_begin_0, end = var_1751_end_0, end_mask = var_1751_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1751_cast_fp16")]; + tensor k_27_perm_0 = const()[name = tensor("k_27_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_1758_begin_0 = const()[name = tensor("op_1758_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1758_end_0 = const()[name = tensor("op_1758_end_0"), val = tensor([2, 576, 1, 64])]; + tensor var_1758_end_mask_0 = const()[name = tensor("op_1758_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_25 = transpose(perm = k_27_perm_0, x = k_25_cast_fp16)[name = tensor("transpose_25")]; + tensor var_1758_cast_fp16 = slice_by_index(begin = var_1758_begin_0, end = var_1758_end_0, end_mask = var_1758_end_mask_0, x = transpose_25)[name = tensor("op_1758_cast_fp16")]; + tensor var_1762_begin_0 = const()[name = tensor("op_1762_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_1762_end_0 = const()[name = tensor("op_1762_end_0"), val = tensor([2, 576, 1, 128])]; + tensor var_1762_end_mask_0 = const()[name = tensor("op_1762_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1762_cast_fp16 = slice_by_index(begin = var_1762_begin_0, end = var_1762_end_0, end_mask = var_1762_end_mask_0, x = transpose_25)[name = tensor("op_1762_cast_fp16")]; + tensor var_1766_begin_0 = const()[name = tensor("op_1766_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_1766_end_0 = const()[name = tensor("op_1766_end_0"), val = tensor([2, 576, 1, 192])]; + tensor var_1766_end_mask_0 = const()[name = tensor("op_1766_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1766_cast_fp16 = slice_by_index(begin = var_1766_begin_0, end = var_1766_end_0, end_mask = var_1766_end_mask_0, x = transpose_25)[name = tensor("op_1766_cast_fp16")]; + tensor var_1770_begin_0 = const()[name = tensor("op_1770_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_1770_end_0 = const()[name = tensor("op_1770_end_0"), val = tensor([2, 576, 1, 256])]; + tensor var_1770_end_mask_0 = const()[name = tensor("op_1770_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1770_cast_fp16 = slice_by_index(begin = var_1770_begin_0, end = var_1770_end_0, end_mask = var_1770_end_mask_0, x = transpose_25)[name = tensor("op_1770_cast_fp16")]; + tensor var_1774_begin_0 = const()[name = tensor("op_1774_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_1774_end_0 = const()[name = tensor("op_1774_end_0"), val = tensor([2, 576, 1, 320])]; + tensor var_1774_end_mask_0 = const()[name = tensor("op_1774_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1774_cast_fp16 = slice_by_index(begin = var_1774_begin_0, end = var_1774_end_0, end_mask = var_1774_end_mask_0, x = transpose_25)[name = tensor("op_1774_cast_fp16")]; + tensor var_1778_begin_0 = const()[name = tensor("op_1778_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_1778_end_0 = const()[name = tensor("op_1778_end_0"), val = tensor([2, 576, 1, 384])]; + tensor var_1778_end_mask_0 = const()[name = tensor("op_1778_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1778_cast_fp16 = slice_by_index(begin = var_1778_begin_0, end = var_1778_end_0, end_mask = var_1778_end_mask_0, x = transpose_25)[name = tensor("op_1778_cast_fp16")]; + tensor var_1782_begin_0 = const()[name = tensor("op_1782_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_1782_end_0 = const()[name = tensor("op_1782_end_0"), val = tensor([2, 576, 1, 448])]; + tensor var_1782_end_mask_0 = const()[name = tensor("op_1782_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1782_cast_fp16 = slice_by_index(begin = var_1782_begin_0, end = var_1782_end_0, end_mask = var_1782_end_mask_0, x = transpose_25)[name = tensor("op_1782_cast_fp16")]; + tensor var_1786_begin_0 = const()[name = tensor("op_1786_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_1786_end_0 = const()[name = tensor("op_1786_end_0"), val = tensor([2, 576, 1, 512])]; + tensor var_1786_end_mask_0 = const()[name = tensor("op_1786_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1786_cast_fp16 = slice_by_index(begin = var_1786_begin_0, end = var_1786_end_0, end_mask = var_1786_end_mask_0, x = transpose_25)[name = tensor("op_1786_cast_fp16")]; + tensor var_1790_begin_0 = const()[name = tensor("op_1790_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_1790_end_0 = const()[name = tensor("op_1790_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_1790_end_mask_0 = const()[name = tensor("op_1790_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1790_cast_fp16 = slice_by_index(begin = var_1790_begin_0, end = var_1790_end_0, end_mask = var_1790_end_mask_0, x = transpose_25)[name = tensor("op_1790_cast_fp16")]; + tensor var_1794_begin_0 = const()[name = tensor("op_1794_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_1794_end_0 = const()[name = tensor("op_1794_end_0"), val = tensor([2, 576, 1, 640])]; + tensor var_1794_end_mask_0 = const()[name = tensor("op_1794_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_1794_cast_fp16 = slice_by_index(begin = var_1794_begin_0, end = var_1794_end_0, end_mask = var_1794_end_mask_0, x = transpose_25)[name = tensor("op_1794_cast_fp16")]; + tensor var_1796_begin_0 = const()[name = tensor("op_1796_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1796_end_0 = const()[name = tensor("op_1796_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_1796_end_mask_0 = const()[name = tensor("op_1796_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1796_cast_fp16 = slice_by_index(begin = var_1796_begin_0, end = var_1796_end_0, end_mask = var_1796_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1796_cast_fp16")]; + tensor var_1800_begin_0 = const()[name = tensor("op_1800_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_1800_end_0 = const()[name = tensor("op_1800_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_1800_end_mask_0 = const()[name = tensor("op_1800_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1800_cast_fp16 = slice_by_index(begin = var_1800_begin_0, end = var_1800_end_0, end_mask = var_1800_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1800_cast_fp16")]; + tensor var_1804_begin_0 = const()[name = tensor("op_1804_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_1804_end_0 = const()[name = tensor("op_1804_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_1804_end_mask_0 = const()[name = tensor("op_1804_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1804_cast_fp16 = slice_by_index(begin = var_1804_begin_0, end = var_1804_end_0, end_mask = var_1804_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1804_cast_fp16")]; + tensor var_1808_begin_0 = const()[name = tensor("op_1808_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_1808_end_0 = const()[name = tensor("op_1808_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_1808_end_mask_0 = const()[name = tensor("op_1808_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1808_cast_fp16 = slice_by_index(begin = var_1808_begin_0, end = var_1808_end_0, end_mask = var_1808_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1808_cast_fp16")]; + tensor var_1812_begin_0 = const()[name = tensor("op_1812_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_1812_end_0 = const()[name = tensor("op_1812_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_1812_end_mask_0 = const()[name = tensor("op_1812_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1812_cast_fp16 = slice_by_index(begin = var_1812_begin_0, end = var_1812_end_0, end_mask = var_1812_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1812_cast_fp16")]; + tensor var_1816_begin_0 = const()[name = tensor("op_1816_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_1816_end_0 = const()[name = tensor("op_1816_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_1816_end_mask_0 = const()[name = tensor("op_1816_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1816_cast_fp16 = slice_by_index(begin = var_1816_begin_0, end = var_1816_end_0, end_mask = var_1816_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1816_cast_fp16")]; + tensor var_1820_begin_0 = const()[name = tensor("op_1820_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_1820_end_0 = const()[name = tensor("op_1820_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_1820_end_mask_0 = const()[name = tensor("op_1820_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1820_cast_fp16 = slice_by_index(begin = var_1820_begin_0, end = var_1820_end_0, end_mask = var_1820_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1820_cast_fp16")]; + tensor var_1824_begin_0 = const()[name = tensor("op_1824_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_1824_end_0 = const()[name = tensor("op_1824_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_1824_end_mask_0 = const()[name = tensor("op_1824_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1824_cast_fp16 = slice_by_index(begin = var_1824_begin_0, end = var_1824_end_0, end_mask = var_1824_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1824_cast_fp16")]; + tensor var_1828_begin_0 = const()[name = tensor("op_1828_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_1828_end_0 = const()[name = tensor("op_1828_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_1828_end_mask_0 = const()[name = tensor("op_1828_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1828_cast_fp16 = slice_by_index(begin = var_1828_begin_0, end = var_1828_end_0, end_mask = var_1828_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1828_cast_fp16")]; + tensor var_1832_begin_0 = const()[name = tensor("op_1832_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_1832_end_0 = const()[name = tensor("op_1832_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_1832_end_mask_0 = const()[name = tensor("op_1832_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1832_cast_fp16 = slice_by_index(begin = var_1832_begin_0, end = var_1832_end_0, end_mask = var_1832_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1832_cast_fp16")]; + tensor var_1836_equation_0 = const()[name = tensor("op_1836_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1836_cast_fp16 = einsum(equation = var_1836_equation_0, values = (var_1758_cast_fp16, var_1715_cast_fp16))[name = tensor("op_1836_cast_fp16")]; + tensor var_1837_to_fp16 = const()[name = tensor("op_1837_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_81_cast_fp16 = mul(x = var_1836_cast_fp16, y = var_1837_to_fp16)[name = tensor("aw_81_cast_fp16")]; + tensor var_1840_equation_0 = const()[name = tensor("op_1840_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1840_cast_fp16 = einsum(equation = var_1840_equation_0, values = (var_1762_cast_fp16, var_1719_cast_fp16))[name = tensor("op_1840_cast_fp16")]; + tensor var_1841_to_fp16 = const()[name = tensor("op_1841_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_83_cast_fp16 = mul(x = var_1840_cast_fp16, y = var_1841_to_fp16)[name = tensor("aw_83_cast_fp16")]; + tensor var_1844_equation_0 = const()[name = tensor("op_1844_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1844_cast_fp16 = einsum(equation = var_1844_equation_0, values = (var_1766_cast_fp16, var_1723_cast_fp16))[name = tensor("op_1844_cast_fp16")]; + tensor var_1845_to_fp16 = const()[name = tensor("op_1845_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_85_cast_fp16 = mul(x = var_1844_cast_fp16, y = var_1845_to_fp16)[name = tensor("aw_85_cast_fp16")]; + tensor var_1848_equation_0 = const()[name = tensor("op_1848_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1848_cast_fp16 = einsum(equation = var_1848_equation_0, values = (var_1770_cast_fp16, var_1727_cast_fp16))[name = tensor("op_1848_cast_fp16")]; + tensor var_1849_to_fp16 = const()[name = tensor("op_1849_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_87_cast_fp16 = mul(x = var_1848_cast_fp16, y = var_1849_to_fp16)[name = tensor("aw_87_cast_fp16")]; + tensor var_1852_equation_0 = const()[name = tensor("op_1852_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1852_cast_fp16 = einsum(equation = var_1852_equation_0, values = (var_1774_cast_fp16, var_1731_cast_fp16))[name = tensor("op_1852_cast_fp16")]; + tensor var_1853_to_fp16 = const()[name = tensor("op_1853_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_89_cast_fp16 = mul(x = var_1852_cast_fp16, y = var_1853_to_fp16)[name = tensor("aw_89_cast_fp16")]; + tensor var_1856_equation_0 = const()[name = tensor("op_1856_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1856_cast_fp16 = einsum(equation = var_1856_equation_0, values = (var_1778_cast_fp16, var_1735_cast_fp16))[name = tensor("op_1856_cast_fp16")]; + tensor var_1857_to_fp16 = const()[name = tensor("op_1857_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_91_cast_fp16 = mul(x = var_1856_cast_fp16, y = var_1857_to_fp16)[name = tensor("aw_91_cast_fp16")]; + tensor var_1860_equation_0 = const()[name = tensor("op_1860_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1860_cast_fp16 = einsum(equation = var_1860_equation_0, values = (var_1782_cast_fp16, var_1739_cast_fp16))[name = tensor("op_1860_cast_fp16")]; + tensor var_1861_to_fp16 = const()[name = tensor("op_1861_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_93_cast_fp16 = mul(x = var_1860_cast_fp16, y = var_1861_to_fp16)[name = tensor("aw_93_cast_fp16")]; + tensor var_1864_equation_0 = const()[name = tensor("op_1864_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1864_cast_fp16 = einsum(equation = var_1864_equation_0, values = (var_1786_cast_fp16, var_1743_cast_fp16))[name = tensor("op_1864_cast_fp16")]; + tensor var_1865_to_fp16 = const()[name = tensor("op_1865_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_95_cast_fp16 = mul(x = var_1864_cast_fp16, y = var_1865_to_fp16)[name = tensor("aw_95_cast_fp16")]; + tensor var_1868_equation_0 = const()[name = tensor("op_1868_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1868_cast_fp16 = einsum(equation = var_1868_equation_0, values = (var_1790_cast_fp16, var_1747_cast_fp16))[name = tensor("op_1868_cast_fp16")]; + tensor var_1869_to_fp16 = const()[name = tensor("op_1869_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_97_cast_fp16 = mul(x = var_1868_cast_fp16, y = var_1869_to_fp16)[name = tensor("aw_97_cast_fp16")]; + tensor var_1872_equation_0 = const()[name = tensor("op_1872_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_1872_cast_fp16 = einsum(equation = var_1872_equation_0, values = (var_1794_cast_fp16, var_1751_cast_fp16))[name = tensor("op_1872_cast_fp16")]; + tensor var_1873_to_fp16 = const()[name = tensor("op_1873_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_99_cast_fp16 = mul(x = var_1872_cast_fp16, y = var_1873_to_fp16)[name = tensor("aw_99_cast_fp16")]; + tensor var_1875_cast_fp16 = softmax(axis = var_984, x = aw_81_cast_fp16)[name = tensor("op_1875_cast_fp16")]; + tensor var_1876_cast_fp16 = softmax(axis = var_984, x = aw_83_cast_fp16)[name = tensor("op_1876_cast_fp16")]; + tensor var_1877_cast_fp16 = softmax(axis = var_984, x = aw_85_cast_fp16)[name = tensor("op_1877_cast_fp16")]; + tensor var_1878_cast_fp16 = softmax(axis = var_984, x = aw_87_cast_fp16)[name = tensor("op_1878_cast_fp16")]; + tensor var_1879_cast_fp16 = softmax(axis = var_984, x = aw_89_cast_fp16)[name = tensor("op_1879_cast_fp16")]; + tensor var_1880_cast_fp16 = softmax(axis = var_984, x = aw_91_cast_fp16)[name = tensor("op_1880_cast_fp16")]; + tensor var_1881_cast_fp16 = softmax(axis = var_984, x = aw_93_cast_fp16)[name = tensor("op_1881_cast_fp16")]; + tensor var_1882_cast_fp16 = softmax(axis = var_984, x = aw_95_cast_fp16)[name = tensor("op_1882_cast_fp16")]; + tensor var_1883_cast_fp16 = softmax(axis = var_984, x = aw_97_cast_fp16)[name = tensor("op_1883_cast_fp16")]; + tensor var_1884_cast_fp16 = softmax(axis = var_984, x = aw_99_cast_fp16)[name = tensor("op_1884_cast_fp16")]; + tensor var_1886_equation_0 = const()[name = tensor("op_1886_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1886_cast_fp16 = einsum(equation = var_1886_equation_0, values = (var_1796_cast_fp16, var_1875_cast_fp16))[name = tensor("op_1886_cast_fp16")]; + tensor var_1888_equation_0 = const()[name = tensor("op_1888_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1888_cast_fp16 = einsum(equation = var_1888_equation_0, values = (var_1800_cast_fp16, var_1876_cast_fp16))[name = tensor("op_1888_cast_fp16")]; + tensor var_1890_equation_0 = const()[name = tensor("op_1890_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1890_cast_fp16 = einsum(equation = var_1890_equation_0, values = (var_1804_cast_fp16, var_1877_cast_fp16))[name = tensor("op_1890_cast_fp16")]; + tensor var_1892_equation_0 = const()[name = tensor("op_1892_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1892_cast_fp16 = einsum(equation = var_1892_equation_0, values = (var_1808_cast_fp16, var_1878_cast_fp16))[name = tensor("op_1892_cast_fp16")]; + tensor var_1894_equation_0 = const()[name = tensor("op_1894_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1894_cast_fp16 = einsum(equation = var_1894_equation_0, values = (var_1812_cast_fp16, var_1879_cast_fp16))[name = tensor("op_1894_cast_fp16")]; + tensor var_1896_equation_0 = const()[name = tensor("op_1896_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1896_cast_fp16 = einsum(equation = var_1896_equation_0, values = (var_1816_cast_fp16, var_1880_cast_fp16))[name = tensor("op_1896_cast_fp16")]; + tensor var_1898_equation_0 = const()[name = tensor("op_1898_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1898_cast_fp16 = einsum(equation = var_1898_equation_0, values = (var_1820_cast_fp16, var_1881_cast_fp16))[name = tensor("op_1898_cast_fp16")]; + tensor var_1900_equation_0 = const()[name = tensor("op_1900_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1900_cast_fp16 = einsum(equation = var_1900_equation_0, values = (var_1824_cast_fp16, var_1882_cast_fp16))[name = tensor("op_1900_cast_fp16")]; + tensor var_1902_equation_0 = const()[name = tensor("op_1902_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1902_cast_fp16 = einsum(equation = var_1902_equation_0, values = (var_1828_cast_fp16, var_1883_cast_fp16))[name = tensor("op_1902_cast_fp16")]; + tensor var_1904_equation_0 = const()[name = tensor("op_1904_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_1904_cast_fp16 = einsum(equation = var_1904_equation_0, values = (var_1832_cast_fp16, var_1884_cast_fp16))[name = tensor("op_1904_cast_fp16")]; + tensor input_105_interleave_0 = const()[name = tensor("input_105_interleave_0"), val = tensor(false)]; + tensor input_105_cast_fp16 = concat(axis = var_984, interleave = input_105_interleave_0, values = (var_1886_cast_fp16, var_1888_cast_fp16, var_1890_cast_fp16, var_1892_cast_fp16, var_1894_cast_fp16, var_1896_cast_fp16, var_1898_cast_fp16, var_1900_cast_fp16, var_1902_cast_fp16, var_1904_cast_fp16))[name = tensor("input_105_cast_fp16")]; + tensor var_1910 = const()[name = tensor("op_1910"), val = tensor([1, 1])]; + tensor var_1912 = const()[name = tensor("op_1912"), val = tensor([1, 1])]; + tensor var_1914_pad_type_0 = const()[name = tensor("op_1914_pad_type_0"), val = tensor("custom")]; + tensor var_1914_pad_0 = const()[name = tensor("op_1914_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77667072)))]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78486336)))]; + tensor var_1914_cast_fp16 = conv(bias = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_1912, groups = var_984, pad = var_1914_pad_0, pad_type = var_1914_pad_type_0, strides = var_1910, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_105_cast_fp16)[name = tensor("op_1914_cast_fp16")]; + tensor inputs_21_cast_fp16 = add(x = var_1914_cast_fp16, y = inputs_19_cast_fp16)[name = tensor("inputs_21_cast_fp16")]; + tensor var_1918 = const()[name = tensor("op_1918"), val = tensor([1])]; + tensor channels_mean_21_cast_fp16 = reduce_mean(axes = var_1918, keep_dims = var_979, x = inputs_21_cast_fp16)[name = tensor("channels_mean_21_cast_fp16")]; + tensor zero_mean_21_cast_fp16 = sub(x = inputs_21_cast_fp16, y = channels_mean_21_cast_fp16)[name = tensor("zero_mean_21_cast_fp16")]; + tensor zero_mean_sq_21_cast_fp16 = mul(x = zero_mean_21_cast_fp16, y = zero_mean_21_cast_fp16)[name = tensor("zero_mean_sq_21_cast_fp16")]; + tensor var_1922 = const()[name = tensor("op_1922"), val = tensor([1])]; + tensor var_1923_cast_fp16 = reduce_mean(axes = var_1922, keep_dims = var_979, x = zero_mean_sq_21_cast_fp16)[name = tensor("op_1923_cast_fp16")]; + tensor var_1924_to_fp16 = const()[name = tensor("op_1924_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1925_cast_fp16 = add(x = var_1923_cast_fp16, y = var_1924_to_fp16)[name = tensor("op_1925_cast_fp16")]; + tensor denom_21_epsilon_0_to_fp16 = const()[name = tensor("denom_21_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_21_cast_fp16 = rsqrt(epsilon = denom_21_epsilon_0_to_fp16, x = var_1925_cast_fp16)[name = tensor("denom_21_cast_fp16")]; + tensor out_21_cast_fp16 = mul(x = zero_mean_21_cast_fp16, y = denom_21_cast_fp16)[name = tensor("out_21_cast_fp16")]; + tensor var_1929_to_fp16 = const()[name = tensor("op_1929_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78487680)))]; + tensor var_1930_cast_fp16 = add(x = out_21_cast_fp16, y = var_1929_to_fp16)[name = tensor("op_1930_cast_fp16")]; + tensor var_1932_to_fp16 = const()[name = tensor("op_1932_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78489024)))]; + tensor hidden_states_65_cast_fp16 = mul(x = var_1930_cast_fp16, y = var_1932_to_fp16)[name = tensor("hidden_states_65_cast_fp16")]; + tensor var_1939 = const()[name = tensor("op_1939"), val = tensor([1, 1])]; + tensor var_1941 = const()[name = tensor("op_1941"), val = tensor([1, 1])]; + tensor q_15_pad_type_0 = const()[name = tensor("q_15_pad_type_0"), val = tensor("custom")]; + tensor q_15_pad_0 = const()[name = tensor("q_15_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78490368)))]; + tensor q_15_cast_fp16 = conv(dilations = var_1941, groups = var_984, pad = q_15_pad_0, pad_type = q_15_pad_type_0, strides = var_1939, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_65_cast_fp16)[name = tensor("q_15_cast_fp16")]; + tensor var_1945 = const()[name = tensor("op_1945"), val = tensor([1, 1])]; + tensor var_1947 = const()[name = tensor("op_1947"), val = tensor([1, 1])]; + tensor k_29_pad_type_0 = const()[name = tensor("k_29_pad_type_0"), val = tensor("custom")]; + tensor k_29_pad_0 = const()[name = tensor("k_29_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79309632)))]; + tensor k_29_cast_fp16 = conv(dilations = var_1947, groups = var_984, pad = k_29_pad_0, pad_type = k_29_pad_type_0, strides = var_1945, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_29_cast_fp16")]; + tensor var_1951 = const()[name = tensor("op_1951"), val = tensor([1, 1])]; + tensor var_1953 = const()[name = tensor("op_1953"), val = tensor([1, 1])]; + tensor v_15_pad_type_0 = const()[name = tensor("v_15_pad_type_0"), val = tensor("custom")]; + tensor v_15_pad_0 = const()[name = tensor("v_15_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80620416)))]; + tensor v_15_cast_fp16 = conv(dilations = var_1953, groups = var_984, pad = v_15_pad_0, pad_type = v_15_pad_type_0, strides = var_1951, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_15_cast_fp16")]; + tensor var_1957_begin_0 = const()[name = tensor("op_1957_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_1957_end_0 = const()[name = tensor("op_1957_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_1957_end_mask_0 = const()[name = tensor("op_1957_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1957_cast_fp16 = slice_by_index(begin = var_1957_begin_0, end = var_1957_end_0, end_mask = var_1957_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1957_cast_fp16")]; + tensor var_1961_begin_0 = const()[name = tensor("op_1961_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_1961_end_0 = const()[name = tensor("op_1961_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_1961_end_mask_0 = const()[name = tensor("op_1961_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1961_cast_fp16 = slice_by_index(begin = var_1961_begin_0, end = var_1961_end_0, end_mask = var_1961_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1961_cast_fp16")]; + tensor var_1965_begin_0 = const()[name = tensor("op_1965_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_1965_end_0 = const()[name = tensor("op_1965_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_1965_end_mask_0 = const()[name = tensor("op_1965_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1965_cast_fp16 = slice_by_index(begin = var_1965_begin_0, end = var_1965_end_0, end_mask = var_1965_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1965_cast_fp16")]; + tensor var_1969_begin_0 = const()[name = tensor("op_1969_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_1969_end_0 = const()[name = tensor("op_1969_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_1969_end_mask_0 = const()[name = tensor("op_1969_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1969_cast_fp16 = slice_by_index(begin = var_1969_begin_0, end = var_1969_end_0, end_mask = var_1969_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1969_cast_fp16")]; + tensor var_1973_begin_0 = const()[name = tensor("op_1973_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_1973_end_0 = const()[name = tensor("op_1973_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_1973_end_mask_0 = const()[name = tensor("op_1973_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1973_cast_fp16 = slice_by_index(begin = var_1973_begin_0, end = var_1973_end_0, end_mask = var_1973_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1973_cast_fp16")]; + tensor var_1977_begin_0 = const()[name = tensor("op_1977_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_1977_end_0 = const()[name = tensor("op_1977_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_1977_end_mask_0 = const()[name = tensor("op_1977_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1977_cast_fp16 = slice_by_index(begin = var_1977_begin_0, end = var_1977_end_0, end_mask = var_1977_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1977_cast_fp16")]; + tensor var_1981_begin_0 = const()[name = tensor("op_1981_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_1981_end_0 = const()[name = tensor("op_1981_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_1981_end_mask_0 = const()[name = tensor("op_1981_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1981_cast_fp16 = slice_by_index(begin = var_1981_begin_0, end = var_1981_end_0, end_mask = var_1981_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1981_cast_fp16")]; + tensor var_1985_begin_0 = const()[name = tensor("op_1985_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_1985_end_0 = const()[name = tensor("op_1985_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_1985_end_mask_0 = const()[name = tensor("op_1985_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1985_cast_fp16 = slice_by_index(begin = var_1985_begin_0, end = var_1985_end_0, end_mask = var_1985_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1985_cast_fp16")]; + tensor var_1989_begin_0 = const()[name = tensor("op_1989_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_1989_end_0 = const()[name = tensor("op_1989_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_1989_end_mask_0 = const()[name = tensor("op_1989_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1989_cast_fp16 = slice_by_index(begin = var_1989_begin_0, end = var_1989_end_0, end_mask = var_1989_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1989_cast_fp16")]; + tensor var_1993_begin_0 = const()[name = tensor("op_1993_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_1993_end_0 = const()[name = tensor("op_1993_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_1993_end_mask_0 = const()[name = tensor("op_1993_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_1993_cast_fp16 = slice_by_index(begin = var_1993_begin_0, end = var_1993_end_0, end_mask = var_1993_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1993_cast_fp16")]; + tensor k_31_perm_0 = const()[name = tensor("k_31_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_2000_begin_0 = const()[name = tensor("op_2000_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_2000_end_0 = const()[name = tensor("op_2000_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_2000_end_mask_0 = const()[name = tensor("op_2000_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_24 = transpose(perm = k_31_perm_0, x = k_29_cast_fp16)[name = tensor("transpose_24")]; + tensor var_2000_cast_fp16 = slice_by_index(begin = var_2000_begin_0, end = var_2000_end_0, end_mask = var_2000_end_mask_0, x = transpose_24)[name = tensor("op_2000_cast_fp16")]; + tensor var_2004_begin_0 = const()[name = tensor("op_2004_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_2004_end_0 = const()[name = tensor("op_2004_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_2004_end_mask_0 = const()[name = tensor("op_2004_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2004_cast_fp16 = slice_by_index(begin = var_2004_begin_0, end = var_2004_end_0, end_mask = var_2004_end_mask_0, x = transpose_24)[name = tensor("op_2004_cast_fp16")]; + tensor var_2008_begin_0 = const()[name = tensor("op_2008_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_2008_end_0 = const()[name = tensor("op_2008_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_2008_end_mask_0 = const()[name = tensor("op_2008_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2008_cast_fp16 = slice_by_index(begin = var_2008_begin_0, end = var_2008_end_0, end_mask = var_2008_end_mask_0, x = transpose_24)[name = tensor("op_2008_cast_fp16")]; + tensor var_2012_begin_0 = const()[name = tensor("op_2012_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_2012_end_0 = const()[name = tensor("op_2012_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_2012_end_mask_0 = const()[name = tensor("op_2012_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2012_cast_fp16 = slice_by_index(begin = var_2012_begin_0, end = var_2012_end_0, end_mask = var_2012_end_mask_0, x = transpose_24)[name = tensor("op_2012_cast_fp16")]; + tensor var_2016_begin_0 = const()[name = tensor("op_2016_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_2016_end_0 = const()[name = tensor("op_2016_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_2016_end_mask_0 = const()[name = tensor("op_2016_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2016_cast_fp16 = slice_by_index(begin = var_2016_begin_0, end = var_2016_end_0, end_mask = var_2016_end_mask_0, x = transpose_24)[name = tensor("op_2016_cast_fp16")]; + tensor var_2020_begin_0 = const()[name = tensor("op_2020_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_2020_end_0 = const()[name = tensor("op_2020_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_2020_end_mask_0 = const()[name = tensor("op_2020_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2020_cast_fp16 = slice_by_index(begin = var_2020_begin_0, end = var_2020_end_0, end_mask = var_2020_end_mask_0, x = transpose_24)[name = tensor("op_2020_cast_fp16")]; + tensor var_2024_begin_0 = const()[name = tensor("op_2024_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_2024_end_0 = const()[name = tensor("op_2024_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_2024_end_mask_0 = const()[name = tensor("op_2024_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2024_cast_fp16 = slice_by_index(begin = var_2024_begin_0, end = var_2024_end_0, end_mask = var_2024_end_mask_0, x = transpose_24)[name = tensor("op_2024_cast_fp16")]; + tensor var_2028_begin_0 = const()[name = tensor("op_2028_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_2028_end_0 = const()[name = tensor("op_2028_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_2028_end_mask_0 = const()[name = tensor("op_2028_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2028_cast_fp16 = slice_by_index(begin = var_2028_begin_0, end = var_2028_end_0, end_mask = var_2028_end_mask_0, x = transpose_24)[name = tensor("op_2028_cast_fp16")]; + tensor var_2032_begin_0 = const()[name = tensor("op_2032_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_2032_end_0 = const()[name = tensor("op_2032_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_2032_end_mask_0 = const()[name = tensor("op_2032_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2032_cast_fp16 = slice_by_index(begin = var_2032_begin_0, end = var_2032_end_0, end_mask = var_2032_end_mask_0, x = transpose_24)[name = tensor("op_2032_cast_fp16")]; + tensor var_2036_begin_0 = const()[name = tensor("op_2036_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_2036_end_0 = const()[name = tensor("op_2036_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_2036_end_mask_0 = const()[name = tensor("op_2036_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2036_cast_fp16 = slice_by_index(begin = var_2036_begin_0, end = var_2036_end_0, end_mask = var_2036_end_mask_0, x = transpose_24)[name = tensor("op_2036_cast_fp16")]; + tensor var_2038_begin_0 = const()[name = tensor("op_2038_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_2038_end_0 = const()[name = tensor("op_2038_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_2038_end_mask_0 = const()[name = tensor("op_2038_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2038_cast_fp16 = slice_by_index(begin = var_2038_begin_0, end = var_2038_end_0, end_mask = var_2038_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2038_cast_fp16")]; + tensor var_2042_begin_0 = const()[name = tensor("op_2042_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_2042_end_0 = const()[name = tensor("op_2042_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_2042_end_mask_0 = const()[name = tensor("op_2042_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2042_cast_fp16 = slice_by_index(begin = var_2042_begin_0, end = var_2042_end_0, end_mask = var_2042_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2042_cast_fp16")]; + tensor var_2046_begin_0 = const()[name = tensor("op_2046_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_2046_end_0 = const()[name = tensor("op_2046_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_2046_end_mask_0 = const()[name = tensor("op_2046_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2046_cast_fp16 = slice_by_index(begin = var_2046_begin_0, end = var_2046_end_0, end_mask = var_2046_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2046_cast_fp16")]; + tensor var_2050_begin_0 = const()[name = tensor("op_2050_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_2050_end_0 = const()[name = tensor("op_2050_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_2050_end_mask_0 = const()[name = tensor("op_2050_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2050_cast_fp16 = slice_by_index(begin = var_2050_begin_0, end = var_2050_end_0, end_mask = var_2050_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2050_cast_fp16")]; + tensor var_2054_begin_0 = const()[name = tensor("op_2054_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_2054_end_0 = const()[name = tensor("op_2054_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_2054_end_mask_0 = const()[name = tensor("op_2054_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2054_cast_fp16 = slice_by_index(begin = var_2054_begin_0, end = var_2054_end_0, end_mask = var_2054_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2054_cast_fp16")]; + tensor var_2058_begin_0 = const()[name = tensor("op_2058_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_2058_end_0 = const()[name = tensor("op_2058_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_2058_end_mask_0 = const()[name = tensor("op_2058_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2058_cast_fp16 = slice_by_index(begin = var_2058_begin_0, end = var_2058_end_0, end_mask = var_2058_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2058_cast_fp16")]; + tensor var_2062_begin_0 = const()[name = tensor("op_2062_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_2062_end_0 = const()[name = tensor("op_2062_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_2062_end_mask_0 = const()[name = tensor("op_2062_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2062_cast_fp16 = slice_by_index(begin = var_2062_begin_0, end = var_2062_end_0, end_mask = var_2062_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2062_cast_fp16")]; + tensor var_2066_begin_0 = const()[name = tensor("op_2066_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_2066_end_0 = const()[name = tensor("op_2066_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_2066_end_mask_0 = const()[name = tensor("op_2066_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2066_cast_fp16 = slice_by_index(begin = var_2066_begin_0, end = var_2066_end_0, end_mask = var_2066_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2066_cast_fp16")]; + tensor var_2070_begin_0 = const()[name = tensor("op_2070_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_2070_end_0 = const()[name = tensor("op_2070_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_2070_end_mask_0 = const()[name = tensor("op_2070_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2070_cast_fp16 = slice_by_index(begin = var_2070_begin_0, end = var_2070_end_0, end_mask = var_2070_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2070_cast_fp16")]; + tensor var_2074_begin_0 = const()[name = tensor("op_2074_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_2074_end_0 = const()[name = tensor("op_2074_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_2074_end_mask_0 = const()[name = tensor("op_2074_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2074_cast_fp16 = slice_by_index(begin = var_2074_begin_0, end = var_2074_end_0, end_mask = var_2074_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2074_cast_fp16")]; + tensor var_2078_equation_0 = const()[name = tensor("op_2078_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2078_cast_fp16 = einsum(equation = var_2078_equation_0, values = (var_2000_cast_fp16, var_1957_cast_fp16))[name = tensor("op_2078_cast_fp16")]; + tensor var_2079_to_fp16 = const()[name = tensor("op_2079_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_101_cast_fp16 = mul(x = var_2078_cast_fp16, y = var_2079_to_fp16)[name = tensor("aw_101_cast_fp16")]; + tensor var_2082_equation_0 = const()[name = tensor("op_2082_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2082_cast_fp16 = einsum(equation = var_2082_equation_0, values = (var_2004_cast_fp16, var_1961_cast_fp16))[name = tensor("op_2082_cast_fp16")]; + tensor var_2083_to_fp16 = const()[name = tensor("op_2083_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_103_cast_fp16 = mul(x = var_2082_cast_fp16, y = var_2083_to_fp16)[name = tensor("aw_103_cast_fp16")]; + tensor var_2086_equation_0 = const()[name = tensor("op_2086_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2086_cast_fp16 = einsum(equation = var_2086_equation_0, values = (var_2008_cast_fp16, var_1965_cast_fp16))[name = tensor("op_2086_cast_fp16")]; + tensor var_2087_to_fp16 = const()[name = tensor("op_2087_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_105_cast_fp16 = mul(x = var_2086_cast_fp16, y = var_2087_to_fp16)[name = tensor("aw_105_cast_fp16")]; + tensor var_2090_equation_0 = const()[name = tensor("op_2090_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2090_cast_fp16 = einsum(equation = var_2090_equation_0, values = (var_2012_cast_fp16, var_1969_cast_fp16))[name = tensor("op_2090_cast_fp16")]; + tensor var_2091_to_fp16 = const()[name = tensor("op_2091_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_107_cast_fp16 = mul(x = var_2090_cast_fp16, y = var_2091_to_fp16)[name = tensor("aw_107_cast_fp16")]; + tensor var_2094_equation_0 = const()[name = tensor("op_2094_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2094_cast_fp16 = einsum(equation = var_2094_equation_0, values = (var_2016_cast_fp16, var_1973_cast_fp16))[name = tensor("op_2094_cast_fp16")]; + tensor var_2095_to_fp16 = const()[name = tensor("op_2095_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_109_cast_fp16 = mul(x = var_2094_cast_fp16, y = var_2095_to_fp16)[name = tensor("aw_109_cast_fp16")]; + tensor var_2098_equation_0 = const()[name = tensor("op_2098_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2098_cast_fp16 = einsum(equation = var_2098_equation_0, values = (var_2020_cast_fp16, var_1977_cast_fp16))[name = tensor("op_2098_cast_fp16")]; + tensor var_2099_to_fp16 = const()[name = tensor("op_2099_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_111_cast_fp16 = mul(x = var_2098_cast_fp16, y = var_2099_to_fp16)[name = tensor("aw_111_cast_fp16")]; + tensor var_2102_equation_0 = const()[name = tensor("op_2102_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2102_cast_fp16 = einsum(equation = var_2102_equation_0, values = (var_2024_cast_fp16, var_1981_cast_fp16))[name = tensor("op_2102_cast_fp16")]; + tensor var_2103_to_fp16 = const()[name = tensor("op_2103_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_113_cast_fp16 = mul(x = var_2102_cast_fp16, y = var_2103_to_fp16)[name = tensor("aw_113_cast_fp16")]; + tensor var_2106_equation_0 = const()[name = tensor("op_2106_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2106_cast_fp16 = einsum(equation = var_2106_equation_0, values = (var_2028_cast_fp16, var_1985_cast_fp16))[name = tensor("op_2106_cast_fp16")]; + tensor var_2107_to_fp16 = const()[name = tensor("op_2107_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_115_cast_fp16 = mul(x = var_2106_cast_fp16, y = var_2107_to_fp16)[name = tensor("aw_115_cast_fp16")]; + tensor var_2110_equation_0 = const()[name = tensor("op_2110_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2110_cast_fp16 = einsum(equation = var_2110_equation_0, values = (var_2032_cast_fp16, var_1989_cast_fp16))[name = tensor("op_2110_cast_fp16")]; + tensor var_2111_to_fp16 = const()[name = tensor("op_2111_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_117_cast_fp16 = mul(x = var_2110_cast_fp16, y = var_2111_to_fp16)[name = tensor("aw_117_cast_fp16")]; + tensor var_2114_equation_0 = const()[name = tensor("op_2114_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2114_cast_fp16 = einsum(equation = var_2114_equation_0, values = (var_2036_cast_fp16, var_1993_cast_fp16))[name = tensor("op_2114_cast_fp16")]; + tensor var_2115_to_fp16 = const()[name = tensor("op_2115_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_119_cast_fp16 = mul(x = var_2114_cast_fp16, y = var_2115_to_fp16)[name = tensor("aw_119_cast_fp16")]; + tensor var_2117_cast_fp16 = softmax(axis = var_984, x = aw_101_cast_fp16)[name = tensor("op_2117_cast_fp16")]; + tensor var_2118_cast_fp16 = softmax(axis = var_984, x = aw_103_cast_fp16)[name = tensor("op_2118_cast_fp16")]; + tensor var_2119_cast_fp16 = softmax(axis = var_984, x = aw_105_cast_fp16)[name = tensor("op_2119_cast_fp16")]; + tensor var_2120_cast_fp16 = softmax(axis = var_984, x = aw_107_cast_fp16)[name = tensor("op_2120_cast_fp16")]; + tensor var_2121_cast_fp16 = softmax(axis = var_984, x = aw_109_cast_fp16)[name = tensor("op_2121_cast_fp16")]; + tensor var_2122_cast_fp16 = softmax(axis = var_984, x = aw_111_cast_fp16)[name = tensor("op_2122_cast_fp16")]; + tensor var_2123_cast_fp16 = softmax(axis = var_984, x = aw_113_cast_fp16)[name = tensor("op_2123_cast_fp16")]; + tensor var_2124_cast_fp16 = softmax(axis = var_984, x = aw_115_cast_fp16)[name = tensor("op_2124_cast_fp16")]; + tensor var_2125_cast_fp16 = softmax(axis = var_984, x = aw_117_cast_fp16)[name = tensor("op_2125_cast_fp16")]; + tensor var_2126_cast_fp16 = softmax(axis = var_984, x = aw_119_cast_fp16)[name = tensor("op_2126_cast_fp16")]; + tensor var_2128_equation_0 = const()[name = tensor("op_2128_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2128_cast_fp16 = einsum(equation = var_2128_equation_0, values = (var_2038_cast_fp16, var_2117_cast_fp16))[name = tensor("op_2128_cast_fp16")]; + tensor var_2130_equation_0 = const()[name = tensor("op_2130_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2130_cast_fp16 = einsum(equation = var_2130_equation_0, values = (var_2042_cast_fp16, var_2118_cast_fp16))[name = tensor("op_2130_cast_fp16")]; + tensor var_2132_equation_0 = const()[name = tensor("op_2132_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2132_cast_fp16 = einsum(equation = var_2132_equation_0, values = (var_2046_cast_fp16, var_2119_cast_fp16))[name = tensor("op_2132_cast_fp16")]; + tensor var_2134_equation_0 = const()[name = tensor("op_2134_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2134_cast_fp16 = einsum(equation = var_2134_equation_0, values = (var_2050_cast_fp16, var_2120_cast_fp16))[name = tensor("op_2134_cast_fp16")]; + tensor var_2136_equation_0 = const()[name = tensor("op_2136_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2136_cast_fp16 = einsum(equation = var_2136_equation_0, values = (var_2054_cast_fp16, var_2121_cast_fp16))[name = tensor("op_2136_cast_fp16")]; + tensor var_2138_equation_0 = const()[name = tensor("op_2138_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2138_cast_fp16 = einsum(equation = var_2138_equation_0, values = (var_2058_cast_fp16, var_2122_cast_fp16))[name = tensor("op_2138_cast_fp16")]; + tensor var_2140_equation_0 = const()[name = tensor("op_2140_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2140_cast_fp16 = einsum(equation = var_2140_equation_0, values = (var_2062_cast_fp16, var_2123_cast_fp16))[name = tensor("op_2140_cast_fp16")]; + tensor var_2142_equation_0 = const()[name = tensor("op_2142_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2142_cast_fp16 = einsum(equation = var_2142_equation_0, values = (var_2066_cast_fp16, var_2124_cast_fp16))[name = tensor("op_2142_cast_fp16")]; + tensor var_2144_equation_0 = const()[name = tensor("op_2144_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2144_cast_fp16 = einsum(equation = var_2144_equation_0, values = (var_2070_cast_fp16, var_2125_cast_fp16))[name = tensor("op_2144_cast_fp16")]; + tensor var_2146_equation_0 = const()[name = tensor("op_2146_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2146_cast_fp16 = einsum(equation = var_2146_equation_0, values = (var_2074_cast_fp16, var_2126_cast_fp16))[name = tensor("op_2146_cast_fp16")]; + tensor input_107_interleave_0 = const()[name = tensor("input_107_interleave_0"), val = tensor(false)]; + tensor input_107_cast_fp16 = concat(axis = var_984, interleave = input_107_interleave_0, values = (var_2128_cast_fp16, var_2130_cast_fp16, var_2132_cast_fp16, var_2134_cast_fp16, var_2136_cast_fp16, var_2138_cast_fp16, var_2140_cast_fp16, var_2142_cast_fp16, var_2144_cast_fp16, var_2146_cast_fp16))[name = tensor("input_107_cast_fp16")]; + tensor var_2152 = const()[name = tensor("op_2152"), val = tensor([1, 1])]; + tensor var_2154 = const()[name = tensor("op_2154"), val = tensor([1, 1])]; + tensor var_2156_pad_type_0 = const()[name = tensor("op_2156_pad_type_0"), val = tensor("custom")]; + tensor var_2156_pad_0 = const()[name = tensor("op_2156_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(81931200)))]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82750464)))]; + tensor var_2156_cast_fp16 = conv(bias = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_2154, groups = var_984, pad = var_2156_pad_0, pad_type = var_2156_pad_type_0, strides = var_2152, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_107_cast_fp16)[name = tensor("op_2156_cast_fp16")]; + tensor inputs_23_cast_fp16 = add(x = var_2156_cast_fp16, y = inputs_21_cast_fp16)[name = tensor("inputs_23_cast_fp16")]; + tensor var_2160 = const()[name = tensor("op_2160"), val = tensor([1])]; + tensor channels_mean_23_cast_fp16 = reduce_mean(axes = var_2160, keep_dims = var_979, x = inputs_23_cast_fp16)[name = tensor("channels_mean_23_cast_fp16")]; + tensor zero_mean_23_cast_fp16 = sub(x = inputs_23_cast_fp16, y = channels_mean_23_cast_fp16)[name = tensor("zero_mean_23_cast_fp16")]; + tensor zero_mean_sq_23_cast_fp16 = mul(x = zero_mean_23_cast_fp16, y = zero_mean_23_cast_fp16)[name = tensor("zero_mean_sq_23_cast_fp16")]; + tensor var_2164 = const()[name = tensor("op_2164"), val = tensor([1])]; + tensor var_2165_cast_fp16 = reduce_mean(axes = var_2164, keep_dims = var_979, x = zero_mean_sq_23_cast_fp16)[name = tensor("op_2165_cast_fp16")]; + tensor var_2166_to_fp16 = const()[name = tensor("op_2166_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2167_cast_fp16 = add(x = var_2165_cast_fp16, y = var_2166_to_fp16)[name = tensor("op_2167_cast_fp16")]; + tensor denom_23_epsilon_0_to_fp16 = const()[name = tensor("denom_23_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_23_cast_fp16 = rsqrt(epsilon = denom_23_epsilon_0_to_fp16, x = var_2167_cast_fp16)[name = tensor("denom_23_cast_fp16")]; + tensor out_23_cast_fp16 = mul(x = zero_mean_23_cast_fp16, y = denom_23_cast_fp16)[name = tensor("out_23_cast_fp16")]; + tensor var_2171_to_fp16 = const()[name = tensor("op_2171_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82751808)))]; + tensor var_2172_cast_fp16 = add(x = out_23_cast_fp16, y = var_2171_to_fp16)[name = tensor("op_2172_cast_fp16")]; + tensor var_2174_to_fp16 = const()[name = tensor("op_2174_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82753152)))]; + tensor input_109_cast_fp16 = mul(x = var_2172_cast_fp16, y = var_2174_to_fp16)[name = tensor("input_109_cast_fp16")]; + tensor var_2182 = const()[name = tensor("op_2182"), val = tensor([1, 1])]; + tensor var_2184 = const()[name = tensor("op_2184"), val = tensor([1, 1])]; + tensor var_2186_pad_type_0 = const()[name = tensor("op_2186_pad_type_0"), val = tensor("custom")]; + tensor var_2186_pad_0 = const()[name = tensor("op_2186_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82754496)))]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89308160)))]; + tensor var_2186_cast_fp16 = conv(bias = down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_2184, groups = var_984, pad = var_2186_pad_0, pad_type = var_2186_pad_type_0, strides = var_2182, weight = down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_109_cast_fp16)[name = tensor("op_2186_cast_fp16")]; + tensor var_2187_split_sizes_0 = const()[name = tensor("op_2187_split_sizes_0"), val = tensor([2560, 2560])]; + tensor var_2187_axis_0 = const()[name = tensor("op_2187_axis_0"), val = tensor(1)]; + tensor var_2187_cast_fp16_0, tensor var_2187_cast_fp16_1 = split(axis = var_2187_axis_0, split_sizes = var_2187_split_sizes_0, x = var_2186_cast_fp16)[name = tensor("op_2187_cast_fp16")]; + tensor var_2189_mode_0 = const()[name = tensor("op_2189_mode_0"), val = tensor("EXACT")]; + tensor var_2189_cast_fp16 = gelu(mode = var_2189_mode_0, x = var_2187_cast_fp16_1)[name = tensor("op_2189_cast_fp16")]; + tensor input_111_cast_fp16 = mul(x = var_2187_cast_fp16_0, y = var_2189_cast_fp16)[name = tensor("input_111_cast_fp16")]; + tensor var_2193 = const()[name = tensor("op_2193"), val = tensor([1, 1])]; + tensor var_2195 = const()[name = tensor("op_2195"), val = tensor([1, 1])]; + tensor var_2197_pad_type_0 = const()[name = tensor("op_2197_pad_type_0"), val = tensor("custom")]; + tensor var_2197_pad_0 = const()[name = tensor("op_2197_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89318464)))]; + tensor down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92595328)))]; + tensor var_2197_cast_fp16 = conv(bias = down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_2195, groups = var_984, pad = var_2197_pad_0, pad_type = var_2197_pad_type_0, strides = var_2193, weight = down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_111_cast_fp16)[name = tensor("op_2197_cast_fp16")]; + tensor hidden_states_69_cast_fp16 = add(x = var_2197_cast_fp16, y = inputs_23_cast_fp16)[name = tensor("hidden_states_69_cast_fp16")]; + tensor var_2199 = const()[name = tensor("op_2199"), val = tensor([2, 640, 24, 24])]; + tensor input_113_cast_fp16 = reshape(shape = var_2199, x = hidden_states_69_cast_fp16)[name = tensor("input_113_cast_fp16")]; + tensor var_2203 = const()[name = tensor("op_2203"), val = tensor([1, 1])]; + tensor var_2205 = const()[name = tensor("op_2205"), val = tensor([1, 1])]; + tensor hidden_states_71_pad_type_0 = const()[name = tensor("hidden_states_71_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_71_pad_0 = const()[name = tensor("hidden_states_71_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_1_attentions_1_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92596672)))]; + tensor down_blocks_1_attentions_1_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93415936)))]; + tensor hidden_states_71_cast_fp16 = conv(bias = down_blocks_1_attentions_1_proj_out_bias_to_fp16, dilations = var_2205, groups = var_984, pad = hidden_states_71_pad_0, pad_type = hidden_states_71_pad_type_0, strides = var_2203, weight = down_blocks_1_attentions_1_proj_out_weight_to_fp16, x = input_113_cast_fp16)[name = tensor("hidden_states_71_cast_fp16")]; + tensor input_115_cast_fp16 = add(x = hidden_states_71_cast_fp16, y = hidden_states_59_cast_fp16)[name = tensor("input_115_cast_fp16")]; + tensor var_2212 = const()[name = tensor("op_2212"), val = tensor([2, 2])]; + tensor var_2214 = const()[name = tensor("op_2214"), val = tensor([1, 1])]; + tensor input_117_pad_type_0 = const()[name = tensor("input_117_pad_type_0"), val = tensor("custom")]; + tensor input_117_pad_0 = const()[name = tensor("input_117_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_1_downsamplers_0_conv_weight_to_fp16 = const()[name = tensor("down_blocks_1_downsamplers_0_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93417280)))]; + tensor down_blocks_1_downsamplers_0_conv_bias_to_fp16 = const()[name = tensor("down_blocks_1_downsamplers_0_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100790144)))]; + tensor input_117_cast_fp16 = conv(bias = down_blocks_1_downsamplers_0_conv_bias_to_fp16, dilations = var_2214, groups = var_984, pad = input_117_pad_0, pad_type = input_117_pad_type_0, strides = var_2212, weight = down_blocks_1_downsamplers_0_conv_weight_to_fp16, x = input_115_cast_fp16)[name = tensor("input_117_cast_fp16")]; + tensor var_2249 = const()[name = tensor("op_2249"), val = tensor(true)]; + tensor var_2254 = const()[name = tensor("op_2254"), val = tensor(1)]; + tensor reshape_48_shape_0 = const()[name = tensor("reshape_48_shape_0"), val = tensor([2, 32, 20, 12, 12])]; + tensor reshape_48_cast_fp16 = reshape(shape = reshape_48_shape_0, x = input_117_cast_fp16)[name = tensor("reshape_48_cast_fp16")]; + tensor reduce_mean_36_axes_0 = const()[name = tensor("reduce_mean_36_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_36_keep_dims_0 = const()[name = tensor("reduce_mean_36_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_36_cast_fp16 = reduce_mean(axes = reduce_mean_36_axes_0, keep_dims = reduce_mean_36_keep_dims_0, x = reshape_48_cast_fp16)[name = tensor("reduce_mean_36_cast_fp16")]; + tensor sub_24_cast_fp16 = sub(x = reshape_48_cast_fp16, y = reduce_mean_36_cast_fp16)[name = tensor("sub_24_cast_fp16")]; + tensor square_12_cast_fp16 = square(x = sub_24_cast_fp16)[name = tensor("square_12_cast_fp16")]; + tensor reduce_mean_38_axes_0 = const()[name = tensor("reduce_mean_38_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_38_keep_dims_0 = const()[name = tensor("reduce_mean_38_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_38_cast_fp16 = reduce_mean(axes = reduce_mean_38_axes_0, keep_dims = reduce_mean_38_keep_dims_0, x = square_12_cast_fp16)[name = tensor("reduce_mean_38_cast_fp16")]; + tensor add_24_y_0_to_fp16 = const()[name = tensor("add_24_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_24_cast_fp16 = add(x = reduce_mean_38_cast_fp16, y = add_24_y_0_to_fp16)[name = tensor("add_24_cast_fp16")]; + tensor sqrt_12_cast_fp16 = sqrt(x = add_24_cast_fp16)[name = tensor("sqrt_12_cast_fp16")]; + tensor real_div_12_cast_fp16 = real_div(x = sub_24_cast_fp16, y = sqrt_12_cast_fp16)[name = tensor("real_div_12_cast_fp16")]; + tensor reshape_49_shape_0 = const()[name = tensor("reshape_49_shape_0"), val = tensor([2, 640, 12, 12])]; + tensor reshape_49_cast_fp16 = reshape(shape = reshape_49_shape_0, x = real_div_12_cast_fp16)[name = tensor("reshape_49_cast_fp16")]; + tensor add_25_gamma_0_to_fp16 = const()[name = tensor("add_25_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100791488)))]; + tensor add_25_beta_0_to_fp16 = const()[name = tensor("add_25_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100792832)))]; + tensor add_25_epsilon_0_to_fp16 = const()[name = tensor("add_25_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_25_cast_fp16 = batch_norm(beta = add_25_beta_0_to_fp16, epsilon = add_25_epsilon_0_to_fp16, gamma = add_25_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_49_cast_fp16)[name = tensor("add_25_cast_fp16")]; + tensor input_121_cast_fp16 = silu(x = add_25_cast_fp16)[name = tensor("input_121_cast_fp16")]; + tensor var_2277 = const()[name = tensor("op_2277"), val = tensor([1, 1])]; + tensor var_2279 = const()[name = tensor("op_2279"), val = tensor([1, 1])]; + tensor hidden_states_73_pad_type_0 = const()[name = tensor("hidden_states_73_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_73_pad_0 = const()[name = tensor("hidden_states_73_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_2_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100794176)))]; + tensor down_blocks_2_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(115539840)))]; + tensor hidden_states_73_cast_fp16 = conv(bias = down_blocks_2_resnets_0_conv1_bias_to_fp16, dilations = var_2279, groups = var_2254, pad = hidden_states_73_pad_0, pad_type = hidden_states_73_pad_type_0, strides = var_2277, weight = down_blocks_2_resnets_0_conv1_weight_to_fp16, x = input_121_cast_fp16)[name = tensor("hidden_states_73_cast_fp16")]; + tensor var_2285 = const()[name = tensor("op_2285"), val = tensor([1, 1])]; + tensor var_2287 = const()[name = tensor("op_2287"), val = tensor([1, 1])]; + tensor temb_9_pad_type_0 = const()[name = tensor("temb_9_pad_type_0"), val = tensor("custom")]; + tensor temb_9_pad_0 = const()[name = tensor("temb_9_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(115542464)))]; + tensor down_blocks_2_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118819328)))]; + tensor temb_9_cast_fp16 = conv(bias = down_blocks_2_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_2287, groups = var_2254, pad = temb_9_pad_0, pad_type = temb_9_pad_type_0, strides = var_2285, weight = down_blocks_2_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_9_cast_fp16")]; + tensor input_125_cast_fp16 = add(x = hidden_states_73_cast_fp16, y = temb_9_cast_fp16)[name = tensor("input_125_cast_fp16")]; + tensor reshape_52_shape_0 = const()[name = tensor("reshape_52_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_52_cast_fp16 = reshape(shape = reshape_52_shape_0, x = input_125_cast_fp16)[name = tensor("reshape_52_cast_fp16")]; + tensor reduce_mean_39_axes_0 = const()[name = tensor("reduce_mean_39_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_39_keep_dims_0 = const()[name = tensor("reduce_mean_39_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_39_cast_fp16 = reduce_mean(axes = reduce_mean_39_axes_0, keep_dims = reduce_mean_39_keep_dims_0, x = reshape_52_cast_fp16)[name = tensor("reduce_mean_39_cast_fp16")]; + tensor sub_26_cast_fp16 = sub(x = reshape_52_cast_fp16, y = reduce_mean_39_cast_fp16)[name = tensor("sub_26_cast_fp16")]; + tensor square_13_cast_fp16 = square(x = sub_26_cast_fp16)[name = tensor("square_13_cast_fp16")]; + tensor reduce_mean_41_axes_0 = const()[name = tensor("reduce_mean_41_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_41_keep_dims_0 = const()[name = tensor("reduce_mean_41_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_41_cast_fp16 = reduce_mean(axes = reduce_mean_41_axes_0, keep_dims = reduce_mean_41_keep_dims_0, x = square_13_cast_fp16)[name = tensor("reduce_mean_41_cast_fp16")]; + tensor add_26_y_0_to_fp16 = const()[name = tensor("add_26_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_26_cast_fp16 = add(x = reduce_mean_41_cast_fp16, y = add_26_y_0_to_fp16)[name = tensor("add_26_cast_fp16")]; + tensor sqrt_13_cast_fp16 = sqrt(x = add_26_cast_fp16)[name = tensor("sqrt_13_cast_fp16")]; + tensor real_div_13_cast_fp16 = real_div(x = sub_26_cast_fp16, y = sqrt_13_cast_fp16)[name = tensor("real_div_13_cast_fp16")]; + tensor reshape_53_shape_0 = const()[name = tensor("reshape_53_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_53_cast_fp16 = reshape(shape = reshape_53_shape_0, x = real_div_13_cast_fp16)[name = tensor("reshape_53_cast_fp16")]; + tensor add_27_mean_0_to_fp16 = const()[name = tensor("add_27_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118821952)))]; + tensor add_27_variance_0_to_fp16 = const()[name = tensor("add_27_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118824576)))]; + tensor add_27_gamma_0_to_fp16 = const()[name = tensor("add_27_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118827200)))]; + tensor add_27_beta_0_to_fp16 = const()[name = tensor("add_27_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118829824)))]; + tensor add_27_epsilon_0_to_fp16 = const()[name = tensor("add_27_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_27_cast_fp16 = batch_norm(beta = add_27_beta_0_to_fp16, epsilon = add_27_epsilon_0_to_fp16, gamma = add_27_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_53_cast_fp16)[name = tensor("add_27_cast_fp16")]; + tensor input_129_cast_fp16 = silu(x = add_27_cast_fp16)[name = tensor("input_129_cast_fp16")]; + tensor var_2297 = const()[name = tensor("op_2297"), val = tensor([1, 1])]; + tensor var_2299 = const()[name = tensor("op_2299"), val = tensor([1, 1])]; + tensor hidden_states_75_pad_type_0 = const()[name = tensor("hidden_states_75_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_75_pad_0 = const()[name = tensor("hidden_states_75_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_2_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118832448)))]; + tensor down_blocks_2_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148323712)))]; + tensor hidden_states_75_cast_fp16 = conv(bias = down_blocks_2_resnets_0_conv2_bias_to_fp16, dilations = var_2299, groups = var_2254, pad = hidden_states_75_pad_0, pad_type = hidden_states_75_pad_type_0, strides = var_2297, weight = down_blocks_2_resnets_0_conv2_weight_to_fp16, x = input_129_cast_fp16)[name = tensor("hidden_states_75_cast_fp16")]; + tensor var_2304 = const()[name = tensor("op_2304"), val = tensor([1, 1])]; + tensor var_2306 = const()[name = tensor("op_2306"), val = tensor([1, 1])]; + tensor x_3_pad_type_0 = const()[name = tensor("x_3_pad_type_0"), val = tensor("custom")]; + tensor x_3_pad_0 = const()[name = tensor("x_3_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_resnets_0_conv_shortcut_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148326336)))]; + tensor down_blocks_2_resnets_0_conv_shortcut_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149964800)))]; + tensor x_3_cast_fp16 = conv(bias = down_blocks_2_resnets_0_conv_shortcut_bias_to_fp16, dilations = var_2306, groups = var_2254, pad = x_3_pad_0, pad_type = x_3_pad_type_0, strides = var_2304, weight = down_blocks_2_resnets_0_conv_shortcut_weight_to_fp16, x = input_117_cast_fp16)[name = tensor("x_3_cast_fp16")]; + tensor hidden_states_77_cast_fp16 = add(x = x_3_cast_fp16, y = hidden_states_75_cast_fp16)[name = tensor("hidden_states_77_cast_fp16")]; + tensor reshape_56_shape_0 = const()[name = tensor("reshape_56_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_56_cast_fp16 = reshape(shape = reshape_56_shape_0, x = hidden_states_77_cast_fp16)[name = tensor("reshape_56_cast_fp16")]; + tensor reduce_mean_42_axes_0 = const()[name = tensor("reduce_mean_42_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_42_keep_dims_0 = const()[name = tensor("reduce_mean_42_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_42_cast_fp16 = reduce_mean(axes = reduce_mean_42_axes_0, keep_dims = reduce_mean_42_keep_dims_0, x = reshape_56_cast_fp16)[name = tensor("reduce_mean_42_cast_fp16")]; + tensor sub_28_cast_fp16 = sub(x = reshape_56_cast_fp16, y = reduce_mean_42_cast_fp16)[name = tensor("sub_28_cast_fp16")]; + tensor square_14_cast_fp16 = square(x = sub_28_cast_fp16)[name = tensor("square_14_cast_fp16")]; + tensor reduce_mean_44_axes_0 = const()[name = tensor("reduce_mean_44_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_44_keep_dims_0 = const()[name = tensor("reduce_mean_44_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_44_cast_fp16 = reduce_mean(axes = reduce_mean_44_axes_0, keep_dims = reduce_mean_44_keep_dims_0, x = square_14_cast_fp16)[name = tensor("reduce_mean_44_cast_fp16")]; + tensor add_28_y_0_to_fp16 = const()[name = tensor("add_28_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_28_cast_fp16 = add(x = reduce_mean_44_cast_fp16, y = add_28_y_0_to_fp16)[name = tensor("add_28_cast_fp16")]; + tensor sqrt_14_cast_fp16 = sqrt(x = add_28_cast_fp16)[name = tensor("sqrt_14_cast_fp16")]; + tensor real_div_14_cast_fp16 = real_div(x = sub_28_cast_fp16, y = sqrt_14_cast_fp16)[name = tensor("real_div_14_cast_fp16")]; + tensor reshape_57_shape_0 = const()[name = tensor("reshape_57_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_57_cast_fp16 = reshape(shape = reshape_57_shape_0, x = real_div_14_cast_fp16)[name = tensor("reshape_57_cast_fp16")]; + tensor add_29_gamma_0_to_fp16 = const()[name = tensor("add_29_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149967424)))]; + tensor add_29_beta_0_to_fp16 = const()[name = tensor("add_29_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149970048)))]; + tensor add_29_epsilon_0_to_fp16 = const()[name = tensor("add_29_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_29_cast_fp16 = batch_norm(beta = add_29_beta_0_to_fp16, epsilon = add_29_epsilon_0_to_fp16, gamma = add_29_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_57_cast_fp16)[name = tensor("add_29_cast_fp16")]; + tensor var_2326 = const()[name = tensor("op_2326"), val = tensor([1, 1])]; + tensor var_2328 = const()[name = tensor("op_2328"), val = tensor([1, 1])]; + tensor hidden_states_79_pad_type_0 = const()[name = tensor("hidden_states_79_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_79_pad_0 = const()[name = tensor("hidden_states_79_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149972672)))]; + tensor down_blocks_2_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153249536)))]; + tensor hidden_states_79_cast_fp16 = conv(bias = down_blocks_2_attentions_0_proj_in_bias_to_fp16, dilations = var_2328, groups = var_2254, pad = hidden_states_79_pad_0, pad_type = hidden_states_79_pad_type_0, strides = var_2326, weight = down_blocks_2_attentions_0_proj_in_weight_to_fp16, x = add_29_cast_fp16)[name = tensor("hidden_states_79_cast_fp16")]; + tensor var_2333 = const()[name = tensor("op_2333"), val = tensor([2, 1280, 1, 144])]; + tensor inputs_25_cast_fp16 = reshape(shape = var_2333, x = hidden_states_79_cast_fp16)[name = tensor("inputs_25_cast_fp16")]; + tensor var_2343 = const()[name = tensor("op_2343"), val = tensor([1])]; + tensor channels_mean_25_cast_fp16 = reduce_mean(axes = var_2343, keep_dims = var_2249, x = inputs_25_cast_fp16)[name = tensor("channels_mean_25_cast_fp16")]; + tensor zero_mean_25_cast_fp16 = sub(x = inputs_25_cast_fp16, y = channels_mean_25_cast_fp16)[name = tensor("zero_mean_25_cast_fp16")]; + tensor zero_mean_sq_25_cast_fp16 = mul(x = zero_mean_25_cast_fp16, y = zero_mean_25_cast_fp16)[name = tensor("zero_mean_sq_25_cast_fp16")]; + tensor var_2347 = const()[name = tensor("op_2347"), val = tensor([1])]; + tensor var_2348_cast_fp16 = reduce_mean(axes = var_2347, keep_dims = var_2249, x = zero_mean_sq_25_cast_fp16)[name = tensor("op_2348_cast_fp16")]; + tensor var_2349_to_fp16 = const()[name = tensor("op_2349_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2350_cast_fp16 = add(x = var_2348_cast_fp16, y = var_2349_to_fp16)[name = tensor("op_2350_cast_fp16")]; + tensor denom_25_epsilon_0_to_fp16 = const()[name = tensor("denom_25_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_25_cast_fp16 = rsqrt(epsilon = denom_25_epsilon_0_to_fp16, x = var_2350_cast_fp16)[name = tensor("denom_25_cast_fp16")]; + tensor out_25_cast_fp16 = mul(x = zero_mean_25_cast_fp16, y = denom_25_cast_fp16)[name = tensor("out_25_cast_fp16")]; + tensor var_2354_to_fp16 = const()[name = tensor("op_2354_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153252160)))]; + tensor var_2355_cast_fp16 = add(x = out_25_cast_fp16, y = var_2354_to_fp16)[name = tensor("op_2355_cast_fp16")]; + tensor var_2357_to_fp16 = const()[name = tensor("op_2357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153254784)))]; + tensor hidden_states_81_cast_fp16 = mul(x = var_2355_cast_fp16, y = var_2357_to_fp16)[name = tensor("hidden_states_81_cast_fp16")]; + tensor var_2364 = const()[name = tensor("op_2364"), val = tensor([1, 1])]; + tensor var_2366 = const()[name = tensor("op_2366"), val = tensor([1, 1])]; + tensor q_17_pad_type_0 = const()[name = tensor("q_17_pad_type_0"), val = tensor("custom")]; + tensor q_17_pad_0 = const()[name = tensor("q_17_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153257408)))]; + tensor q_17_cast_fp16 = conv(dilations = var_2366, groups = var_2254, pad = q_17_pad_0, pad_type = q_17_pad_type_0, strides = var_2364, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_81_cast_fp16)[name = tensor("q_17_cast_fp16")]; + tensor var_2370 = const()[name = tensor("op_2370"), val = tensor([1, 1])]; + tensor var_2372 = const()[name = tensor("op_2372"), val = tensor([1, 1])]; + tensor k_33_pad_type_0 = const()[name = tensor("k_33_pad_type_0"), val = tensor("custom")]; + tensor k_33_pad_0 = const()[name = tensor("k_33_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156534272)))]; + tensor k_33_cast_fp16 = conv(dilations = var_2372, groups = var_2254, pad = k_33_pad_0, pad_type = k_33_pad_type_0, strides = var_2370, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_81_cast_fp16)[name = tensor("k_33_cast_fp16")]; + tensor var_2376 = const()[name = tensor("op_2376"), val = tensor([1, 1])]; + tensor var_2378 = const()[name = tensor("op_2378"), val = tensor([1, 1])]; + tensor v_17_pad_type_0 = const()[name = tensor("v_17_pad_type_0"), val = tensor("custom")]; + tensor v_17_pad_0 = const()[name = tensor("v_17_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159811136)))]; + tensor v_17_cast_fp16 = conv(dilations = var_2378, groups = var_2254, pad = v_17_pad_0, pad_type = v_17_pad_type_0, strides = var_2376, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_81_cast_fp16)[name = tensor("v_17_cast_fp16")]; + tensor var_2382_begin_0 = const()[name = tensor("op_2382_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_2382_end_0 = const()[name = tensor("op_2382_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_2382_end_mask_0 = const()[name = tensor("op_2382_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2382_cast_fp16 = slice_by_index(begin = var_2382_begin_0, end = var_2382_end_0, end_mask = var_2382_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2382_cast_fp16")]; + tensor var_2386_begin_0 = const()[name = tensor("op_2386_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_2386_end_0 = const()[name = tensor("op_2386_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_2386_end_mask_0 = const()[name = tensor("op_2386_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2386_cast_fp16 = slice_by_index(begin = var_2386_begin_0, end = var_2386_end_0, end_mask = var_2386_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2386_cast_fp16")]; + tensor var_2390_begin_0 = const()[name = tensor("op_2390_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_2390_end_0 = const()[name = tensor("op_2390_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_2390_end_mask_0 = const()[name = tensor("op_2390_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2390_cast_fp16 = slice_by_index(begin = var_2390_begin_0, end = var_2390_end_0, end_mask = var_2390_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2390_cast_fp16")]; + tensor var_2394_begin_0 = const()[name = tensor("op_2394_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_2394_end_0 = const()[name = tensor("op_2394_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_2394_end_mask_0 = const()[name = tensor("op_2394_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2394_cast_fp16 = slice_by_index(begin = var_2394_begin_0, end = var_2394_end_0, end_mask = var_2394_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2394_cast_fp16")]; + tensor var_2398_begin_0 = const()[name = tensor("op_2398_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_2398_end_0 = const()[name = tensor("op_2398_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_2398_end_mask_0 = const()[name = tensor("op_2398_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2398_cast_fp16 = slice_by_index(begin = var_2398_begin_0, end = var_2398_end_0, end_mask = var_2398_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2398_cast_fp16")]; + tensor var_2402_begin_0 = const()[name = tensor("op_2402_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_2402_end_0 = const()[name = tensor("op_2402_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_2402_end_mask_0 = const()[name = tensor("op_2402_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2402_cast_fp16 = slice_by_index(begin = var_2402_begin_0, end = var_2402_end_0, end_mask = var_2402_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2402_cast_fp16")]; + tensor var_2406_begin_0 = const()[name = tensor("op_2406_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_2406_end_0 = const()[name = tensor("op_2406_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_2406_end_mask_0 = const()[name = tensor("op_2406_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2406_cast_fp16 = slice_by_index(begin = var_2406_begin_0, end = var_2406_end_0, end_mask = var_2406_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2406_cast_fp16")]; + tensor var_2410_begin_0 = const()[name = tensor("op_2410_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_2410_end_0 = const()[name = tensor("op_2410_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_2410_end_mask_0 = const()[name = tensor("op_2410_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2410_cast_fp16 = slice_by_index(begin = var_2410_begin_0, end = var_2410_end_0, end_mask = var_2410_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2410_cast_fp16")]; + tensor var_2414_begin_0 = const()[name = tensor("op_2414_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_2414_end_0 = const()[name = tensor("op_2414_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_2414_end_mask_0 = const()[name = tensor("op_2414_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2414_cast_fp16 = slice_by_index(begin = var_2414_begin_0, end = var_2414_end_0, end_mask = var_2414_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2414_cast_fp16")]; + tensor var_2418_begin_0 = const()[name = tensor("op_2418_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_2418_end_0 = const()[name = tensor("op_2418_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_2418_end_mask_0 = const()[name = tensor("op_2418_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2418_cast_fp16 = slice_by_index(begin = var_2418_begin_0, end = var_2418_end_0, end_mask = var_2418_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2418_cast_fp16")]; + tensor var_2422_begin_0 = const()[name = tensor("op_2422_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_2422_end_0 = const()[name = tensor("op_2422_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_2422_end_mask_0 = const()[name = tensor("op_2422_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2422_cast_fp16 = slice_by_index(begin = var_2422_begin_0, end = var_2422_end_0, end_mask = var_2422_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2422_cast_fp16")]; + tensor var_2426_begin_0 = const()[name = tensor("op_2426_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_2426_end_0 = const()[name = tensor("op_2426_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_2426_end_mask_0 = const()[name = tensor("op_2426_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2426_cast_fp16 = slice_by_index(begin = var_2426_begin_0, end = var_2426_end_0, end_mask = var_2426_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2426_cast_fp16")]; + tensor var_2430_begin_0 = const()[name = tensor("op_2430_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_2430_end_0 = const()[name = tensor("op_2430_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_2430_end_mask_0 = const()[name = tensor("op_2430_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2430_cast_fp16 = slice_by_index(begin = var_2430_begin_0, end = var_2430_end_0, end_mask = var_2430_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2430_cast_fp16")]; + tensor var_2434_begin_0 = const()[name = tensor("op_2434_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_2434_end_0 = const()[name = tensor("op_2434_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_2434_end_mask_0 = const()[name = tensor("op_2434_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2434_cast_fp16 = slice_by_index(begin = var_2434_begin_0, end = var_2434_end_0, end_mask = var_2434_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2434_cast_fp16")]; + tensor var_2438_begin_0 = const()[name = tensor("op_2438_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_2438_end_0 = const()[name = tensor("op_2438_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_2438_end_mask_0 = const()[name = tensor("op_2438_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2438_cast_fp16 = slice_by_index(begin = var_2438_begin_0, end = var_2438_end_0, end_mask = var_2438_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2438_cast_fp16")]; + tensor var_2442_begin_0 = const()[name = tensor("op_2442_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_2442_end_0 = const()[name = tensor("op_2442_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_2442_end_mask_0 = const()[name = tensor("op_2442_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2442_cast_fp16 = slice_by_index(begin = var_2442_begin_0, end = var_2442_end_0, end_mask = var_2442_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2442_cast_fp16")]; + tensor var_2446_begin_0 = const()[name = tensor("op_2446_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_2446_end_0 = const()[name = tensor("op_2446_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_2446_end_mask_0 = const()[name = tensor("op_2446_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2446_cast_fp16 = slice_by_index(begin = var_2446_begin_0, end = var_2446_end_0, end_mask = var_2446_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2446_cast_fp16")]; + tensor var_2450_begin_0 = const()[name = tensor("op_2450_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_2450_end_0 = const()[name = tensor("op_2450_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_2450_end_mask_0 = const()[name = tensor("op_2450_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2450_cast_fp16 = slice_by_index(begin = var_2450_begin_0, end = var_2450_end_0, end_mask = var_2450_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2450_cast_fp16")]; + tensor var_2454_begin_0 = const()[name = tensor("op_2454_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_2454_end_0 = const()[name = tensor("op_2454_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_2454_end_mask_0 = const()[name = tensor("op_2454_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2454_cast_fp16 = slice_by_index(begin = var_2454_begin_0, end = var_2454_end_0, end_mask = var_2454_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2454_cast_fp16")]; + tensor var_2458_begin_0 = const()[name = tensor("op_2458_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_2458_end_0 = const()[name = tensor("op_2458_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_2458_end_mask_0 = const()[name = tensor("op_2458_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2458_cast_fp16 = slice_by_index(begin = var_2458_begin_0, end = var_2458_end_0, end_mask = var_2458_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2458_cast_fp16")]; + tensor k_35_perm_0 = const()[name = tensor("k_35_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_2465_begin_0 = const()[name = tensor("op_2465_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_2465_end_0 = const()[name = tensor("op_2465_end_0"), val = tensor([2, 144, 1, 64])]; + tensor var_2465_end_mask_0 = const()[name = tensor("op_2465_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_23 = transpose(perm = k_35_perm_0, x = k_33_cast_fp16)[name = tensor("transpose_23")]; + tensor var_2465_cast_fp16 = slice_by_index(begin = var_2465_begin_0, end = var_2465_end_0, end_mask = var_2465_end_mask_0, x = transpose_23)[name = tensor("op_2465_cast_fp16")]; + tensor var_2469_begin_0 = const()[name = tensor("op_2469_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_2469_end_0 = const()[name = tensor("op_2469_end_0"), val = tensor([2, 144, 1, 128])]; + tensor var_2469_end_mask_0 = const()[name = tensor("op_2469_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2469_cast_fp16 = slice_by_index(begin = var_2469_begin_0, end = var_2469_end_0, end_mask = var_2469_end_mask_0, x = transpose_23)[name = tensor("op_2469_cast_fp16")]; + tensor var_2473_begin_0 = const()[name = tensor("op_2473_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_2473_end_0 = const()[name = tensor("op_2473_end_0"), val = tensor([2, 144, 1, 192])]; + tensor var_2473_end_mask_0 = const()[name = tensor("op_2473_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2473_cast_fp16 = slice_by_index(begin = var_2473_begin_0, end = var_2473_end_0, end_mask = var_2473_end_mask_0, x = transpose_23)[name = tensor("op_2473_cast_fp16")]; + tensor var_2477_begin_0 = const()[name = tensor("op_2477_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_2477_end_0 = const()[name = tensor("op_2477_end_0"), val = tensor([2, 144, 1, 256])]; + tensor var_2477_end_mask_0 = const()[name = tensor("op_2477_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2477_cast_fp16 = slice_by_index(begin = var_2477_begin_0, end = var_2477_end_0, end_mask = var_2477_end_mask_0, x = transpose_23)[name = tensor("op_2477_cast_fp16")]; + tensor var_2481_begin_0 = const()[name = tensor("op_2481_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_2481_end_0 = const()[name = tensor("op_2481_end_0"), val = tensor([2, 144, 1, 320])]; + tensor var_2481_end_mask_0 = const()[name = tensor("op_2481_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2481_cast_fp16 = slice_by_index(begin = var_2481_begin_0, end = var_2481_end_0, end_mask = var_2481_end_mask_0, x = transpose_23)[name = tensor("op_2481_cast_fp16")]; + tensor var_2485_begin_0 = const()[name = tensor("op_2485_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_2485_end_0 = const()[name = tensor("op_2485_end_0"), val = tensor([2, 144, 1, 384])]; + tensor var_2485_end_mask_0 = const()[name = tensor("op_2485_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2485_cast_fp16 = slice_by_index(begin = var_2485_begin_0, end = var_2485_end_0, end_mask = var_2485_end_mask_0, x = transpose_23)[name = tensor("op_2485_cast_fp16")]; + tensor var_2489_begin_0 = const()[name = tensor("op_2489_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_2489_end_0 = const()[name = tensor("op_2489_end_0"), val = tensor([2, 144, 1, 448])]; + tensor var_2489_end_mask_0 = const()[name = tensor("op_2489_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2489_cast_fp16 = slice_by_index(begin = var_2489_begin_0, end = var_2489_end_0, end_mask = var_2489_end_mask_0, x = transpose_23)[name = tensor("op_2489_cast_fp16")]; + tensor var_2493_begin_0 = const()[name = tensor("op_2493_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_2493_end_0 = const()[name = tensor("op_2493_end_0"), val = tensor([2, 144, 1, 512])]; + tensor var_2493_end_mask_0 = const()[name = tensor("op_2493_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2493_cast_fp16 = slice_by_index(begin = var_2493_begin_0, end = var_2493_end_0, end_mask = var_2493_end_mask_0, x = transpose_23)[name = tensor("op_2493_cast_fp16")]; + tensor var_2497_begin_0 = const()[name = tensor("op_2497_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_2497_end_0 = const()[name = tensor("op_2497_end_0"), val = tensor([2, 144, 1, 576])]; + tensor var_2497_end_mask_0 = const()[name = tensor("op_2497_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2497_cast_fp16 = slice_by_index(begin = var_2497_begin_0, end = var_2497_end_0, end_mask = var_2497_end_mask_0, x = transpose_23)[name = tensor("op_2497_cast_fp16")]; + tensor var_2501_begin_0 = const()[name = tensor("op_2501_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_2501_end_0 = const()[name = tensor("op_2501_end_0"), val = tensor([2, 144, 1, 640])]; + tensor var_2501_end_mask_0 = const()[name = tensor("op_2501_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2501_cast_fp16 = slice_by_index(begin = var_2501_begin_0, end = var_2501_end_0, end_mask = var_2501_end_mask_0, x = transpose_23)[name = tensor("op_2501_cast_fp16")]; + tensor var_2505_begin_0 = const()[name = tensor("op_2505_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_2505_end_0 = const()[name = tensor("op_2505_end_0"), val = tensor([2, 144, 1, 704])]; + tensor var_2505_end_mask_0 = const()[name = tensor("op_2505_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2505_cast_fp16 = slice_by_index(begin = var_2505_begin_0, end = var_2505_end_0, end_mask = var_2505_end_mask_0, x = transpose_23)[name = tensor("op_2505_cast_fp16")]; + tensor var_2509_begin_0 = const()[name = tensor("op_2509_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_2509_end_0 = const()[name = tensor("op_2509_end_0"), val = tensor([2, 144, 1, 768])]; + tensor var_2509_end_mask_0 = const()[name = tensor("op_2509_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2509_cast_fp16 = slice_by_index(begin = var_2509_begin_0, end = var_2509_end_0, end_mask = var_2509_end_mask_0, x = transpose_23)[name = tensor("op_2509_cast_fp16")]; + tensor var_2513_begin_0 = const()[name = tensor("op_2513_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_2513_end_0 = const()[name = tensor("op_2513_end_0"), val = tensor([2, 144, 1, 832])]; + tensor var_2513_end_mask_0 = const()[name = tensor("op_2513_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2513_cast_fp16 = slice_by_index(begin = var_2513_begin_0, end = var_2513_end_0, end_mask = var_2513_end_mask_0, x = transpose_23)[name = tensor("op_2513_cast_fp16")]; + tensor var_2517_begin_0 = const()[name = tensor("op_2517_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_2517_end_0 = const()[name = tensor("op_2517_end_0"), val = tensor([2, 144, 1, 896])]; + tensor var_2517_end_mask_0 = const()[name = tensor("op_2517_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2517_cast_fp16 = slice_by_index(begin = var_2517_begin_0, end = var_2517_end_0, end_mask = var_2517_end_mask_0, x = transpose_23)[name = tensor("op_2517_cast_fp16")]; + tensor var_2521_begin_0 = const()[name = tensor("op_2521_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_2521_end_0 = const()[name = tensor("op_2521_end_0"), val = tensor([2, 144, 1, 960])]; + tensor var_2521_end_mask_0 = const()[name = tensor("op_2521_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2521_cast_fp16 = slice_by_index(begin = var_2521_begin_0, end = var_2521_end_0, end_mask = var_2521_end_mask_0, x = transpose_23)[name = tensor("op_2521_cast_fp16")]; + tensor var_2525_begin_0 = const()[name = tensor("op_2525_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_2525_end_0 = const()[name = tensor("op_2525_end_0"), val = tensor([2, 144, 1, 1024])]; + tensor var_2525_end_mask_0 = const()[name = tensor("op_2525_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2525_cast_fp16 = slice_by_index(begin = var_2525_begin_0, end = var_2525_end_0, end_mask = var_2525_end_mask_0, x = transpose_23)[name = tensor("op_2525_cast_fp16")]; + tensor var_2529_begin_0 = const()[name = tensor("op_2529_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_2529_end_0 = const()[name = tensor("op_2529_end_0"), val = tensor([2, 144, 1, 1088])]; + tensor var_2529_end_mask_0 = const()[name = tensor("op_2529_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2529_cast_fp16 = slice_by_index(begin = var_2529_begin_0, end = var_2529_end_0, end_mask = var_2529_end_mask_0, x = transpose_23)[name = tensor("op_2529_cast_fp16")]; + tensor var_2533_begin_0 = const()[name = tensor("op_2533_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_2533_end_0 = const()[name = tensor("op_2533_end_0"), val = tensor([2, 144, 1, 1152])]; + tensor var_2533_end_mask_0 = const()[name = tensor("op_2533_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2533_cast_fp16 = slice_by_index(begin = var_2533_begin_0, end = var_2533_end_0, end_mask = var_2533_end_mask_0, x = transpose_23)[name = tensor("op_2533_cast_fp16")]; + tensor var_2537_begin_0 = const()[name = tensor("op_2537_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_2537_end_0 = const()[name = tensor("op_2537_end_0"), val = tensor([2, 144, 1, 1216])]; + tensor var_2537_end_mask_0 = const()[name = tensor("op_2537_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2537_cast_fp16 = slice_by_index(begin = var_2537_begin_0, end = var_2537_end_0, end_mask = var_2537_end_mask_0, x = transpose_23)[name = tensor("op_2537_cast_fp16")]; + tensor var_2541_begin_0 = const()[name = tensor("op_2541_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_2541_end_0 = const()[name = tensor("op_2541_end_0"), val = tensor([2, 144, 1, 1280])]; + tensor var_2541_end_mask_0 = const()[name = tensor("op_2541_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2541_cast_fp16 = slice_by_index(begin = var_2541_begin_0, end = var_2541_end_0, end_mask = var_2541_end_mask_0, x = transpose_23)[name = tensor("op_2541_cast_fp16")]; + tensor var_2543_begin_0 = const()[name = tensor("op_2543_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_2543_end_0 = const()[name = tensor("op_2543_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_2543_end_mask_0 = const()[name = tensor("op_2543_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2543_cast_fp16 = slice_by_index(begin = var_2543_begin_0, end = var_2543_end_0, end_mask = var_2543_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2543_cast_fp16")]; + tensor var_2547_begin_0 = const()[name = tensor("op_2547_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_2547_end_0 = const()[name = tensor("op_2547_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_2547_end_mask_0 = const()[name = tensor("op_2547_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2547_cast_fp16 = slice_by_index(begin = var_2547_begin_0, end = var_2547_end_0, end_mask = var_2547_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2547_cast_fp16")]; + tensor var_2551_begin_0 = const()[name = tensor("op_2551_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_2551_end_0 = const()[name = tensor("op_2551_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_2551_end_mask_0 = const()[name = tensor("op_2551_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2551_cast_fp16 = slice_by_index(begin = var_2551_begin_0, end = var_2551_end_0, end_mask = var_2551_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2551_cast_fp16")]; + tensor var_2555_begin_0 = const()[name = tensor("op_2555_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_2555_end_0 = const()[name = tensor("op_2555_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_2555_end_mask_0 = const()[name = tensor("op_2555_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2555_cast_fp16 = slice_by_index(begin = var_2555_begin_0, end = var_2555_end_0, end_mask = var_2555_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2555_cast_fp16")]; + tensor var_2559_begin_0 = const()[name = tensor("op_2559_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_2559_end_0 = const()[name = tensor("op_2559_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_2559_end_mask_0 = const()[name = tensor("op_2559_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2559_cast_fp16 = slice_by_index(begin = var_2559_begin_0, end = var_2559_end_0, end_mask = var_2559_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2559_cast_fp16")]; + tensor var_2563_begin_0 = const()[name = tensor("op_2563_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_2563_end_0 = const()[name = tensor("op_2563_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_2563_end_mask_0 = const()[name = tensor("op_2563_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2563_cast_fp16 = slice_by_index(begin = var_2563_begin_0, end = var_2563_end_0, end_mask = var_2563_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2563_cast_fp16")]; + tensor var_2567_begin_0 = const()[name = tensor("op_2567_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_2567_end_0 = const()[name = tensor("op_2567_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_2567_end_mask_0 = const()[name = tensor("op_2567_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2567_cast_fp16 = slice_by_index(begin = var_2567_begin_0, end = var_2567_end_0, end_mask = var_2567_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2567_cast_fp16")]; + tensor var_2571_begin_0 = const()[name = tensor("op_2571_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_2571_end_0 = const()[name = tensor("op_2571_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_2571_end_mask_0 = const()[name = tensor("op_2571_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2571_cast_fp16 = slice_by_index(begin = var_2571_begin_0, end = var_2571_end_0, end_mask = var_2571_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2571_cast_fp16")]; + tensor var_2575_begin_0 = const()[name = tensor("op_2575_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_2575_end_0 = const()[name = tensor("op_2575_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_2575_end_mask_0 = const()[name = tensor("op_2575_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2575_cast_fp16 = slice_by_index(begin = var_2575_begin_0, end = var_2575_end_0, end_mask = var_2575_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2575_cast_fp16")]; + tensor var_2579_begin_0 = const()[name = tensor("op_2579_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_2579_end_0 = const()[name = tensor("op_2579_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_2579_end_mask_0 = const()[name = tensor("op_2579_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2579_cast_fp16 = slice_by_index(begin = var_2579_begin_0, end = var_2579_end_0, end_mask = var_2579_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2579_cast_fp16")]; + tensor var_2583_begin_0 = const()[name = tensor("op_2583_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_2583_end_0 = const()[name = tensor("op_2583_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_2583_end_mask_0 = const()[name = tensor("op_2583_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2583_cast_fp16 = slice_by_index(begin = var_2583_begin_0, end = var_2583_end_0, end_mask = var_2583_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2583_cast_fp16")]; + tensor var_2587_begin_0 = const()[name = tensor("op_2587_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_2587_end_0 = const()[name = tensor("op_2587_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_2587_end_mask_0 = const()[name = tensor("op_2587_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2587_cast_fp16 = slice_by_index(begin = var_2587_begin_0, end = var_2587_end_0, end_mask = var_2587_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2587_cast_fp16")]; + tensor var_2591_begin_0 = const()[name = tensor("op_2591_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_2591_end_0 = const()[name = tensor("op_2591_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_2591_end_mask_0 = const()[name = tensor("op_2591_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2591_cast_fp16 = slice_by_index(begin = var_2591_begin_0, end = var_2591_end_0, end_mask = var_2591_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2591_cast_fp16")]; + tensor var_2595_begin_0 = const()[name = tensor("op_2595_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_2595_end_0 = const()[name = tensor("op_2595_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_2595_end_mask_0 = const()[name = tensor("op_2595_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2595_cast_fp16 = slice_by_index(begin = var_2595_begin_0, end = var_2595_end_0, end_mask = var_2595_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2595_cast_fp16")]; + tensor var_2599_begin_0 = const()[name = tensor("op_2599_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_2599_end_0 = const()[name = tensor("op_2599_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_2599_end_mask_0 = const()[name = tensor("op_2599_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2599_cast_fp16 = slice_by_index(begin = var_2599_begin_0, end = var_2599_end_0, end_mask = var_2599_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2599_cast_fp16")]; + tensor var_2603_begin_0 = const()[name = tensor("op_2603_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_2603_end_0 = const()[name = tensor("op_2603_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_2603_end_mask_0 = const()[name = tensor("op_2603_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2603_cast_fp16 = slice_by_index(begin = var_2603_begin_0, end = var_2603_end_0, end_mask = var_2603_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2603_cast_fp16")]; + tensor var_2607_begin_0 = const()[name = tensor("op_2607_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_2607_end_0 = const()[name = tensor("op_2607_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_2607_end_mask_0 = const()[name = tensor("op_2607_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2607_cast_fp16 = slice_by_index(begin = var_2607_begin_0, end = var_2607_end_0, end_mask = var_2607_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2607_cast_fp16")]; + tensor var_2611_begin_0 = const()[name = tensor("op_2611_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_2611_end_0 = const()[name = tensor("op_2611_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_2611_end_mask_0 = const()[name = tensor("op_2611_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2611_cast_fp16 = slice_by_index(begin = var_2611_begin_0, end = var_2611_end_0, end_mask = var_2611_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2611_cast_fp16")]; + tensor var_2615_begin_0 = const()[name = tensor("op_2615_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_2615_end_0 = const()[name = tensor("op_2615_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_2615_end_mask_0 = const()[name = tensor("op_2615_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2615_cast_fp16 = slice_by_index(begin = var_2615_begin_0, end = var_2615_end_0, end_mask = var_2615_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2615_cast_fp16")]; + tensor var_2619_begin_0 = const()[name = tensor("op_2619_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_2619_end_0 = const()[name = tensor("op_2619_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_2619_end_mask_0 = const()[name = tensor("op_2619_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2619_cast_fp16 = slice_by_index(begin = var_2619_begin_0, end = var_2619_end_0, end_mask = var_2619_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2619_cast_fp16")]; + tensor var_2623_equation_0 = const()[name = tensor("op_2623_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2623_cast_fp16 = einsum(equation = var_2623_equation_0, values = (var_2465_cast_fp16, var_2382_cast_fp16))[name = tensor("op_2623_cast_fp16")]; + tensor var_2624_to_fp16 = const()[name = tensor("op_2624_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_121_cast_fp16 = mul(x = var_2623_cast_fp16, y = var_2624_to_fp16)[name = tensor("aw_121_cast_fp16")]; + tensor var_2627_equation_0 = const()[name = tensor("op_2627_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2627_cast_fp16 = einsum(equation = var_2627_equation_0, values = (var_2469_cast_fp16, var_2386_cast_fp16))[name = tensor("op_2627_cast_fp16")]; + tensor var_2628_to_fp16 = const()[name = tensor("op_2628_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_123_cast_fp16 = mul(x = var_2627_cast_fp16, y = var_2628_to_fp16)[name = tensor("aw_123_cast_fp16")]; + tensor var_2631_equation_0 = const()[name = tensor("op_2631_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2631_cast_fp16 = einsum(equation = var_2631_equation_0, values = (var_2473_cast_fp16, var_2390_cast_fp16))[name = tensor("op_2631_cast_fp16")]; + tensor var_2632_to_fp16 = const()[name = tensor("op_2632_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_125_cast_fp16 = mul(x = var_2631_cast_fp16, y = var_2632_to_fp16)[name = tensor("aw_125_cast_fp16")]; + tensor var_2635_equation_0 = const()[name = tensor("op_2635_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2635_cast_fp16 = einsum(equation = var_2635_equation_0, values = (var_2477_cast_fp16, var_2394_cast_fp16))[name = tensor("op_2635_cast_fp16")]; + tensor var_2636_to_fp16 = const()[name = tensor("op_2636_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_127_cast_fp16 = mul(x = var_2635_cast_fp16, y = var_2636_to_fp16)[name = tensor("aw_127_cast_fp16")]; + tensor var_2639_equation_0 = const()[name = tensor("op_2639_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2639_cast_fp16 = einsum(equation = var_2639_equation_0, values = (var_2481_cast_fp16, var_2398_cast_fp16))[name = tensor("op_2639_cast_fp16")]; + tensor var_2640_to_fp16 = const()[name = tensor("op_2640_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_129_cast_fp16 = mul(x = var_2639_cast_fp16, y = var_2640_to_fp16)[name = tensor("aw_129_cast_fp16")]; + tensor var_2643_equation_0 = const()[name = tensor("op_2643_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2643_cast_fp16 = einsum(equation = var_2643_equation_0, values = (var_2485_cast_fp16, var_2402_cast_fp16))[name = tensor("op_2643_cast_fp16")]; + tensor var_2644_to_fp16 = const()[name = tensor("op_2644_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_131_cast_fp16 = mul(x = var_2643_cast_fp16, y = var_2644_to_fp16)[name = tensor("aw_131_cast_fp16")]; + tensor var_2647_equation_0 = const()[name = tensor("op_2647_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2647_cast_fp16 = einsum(equation = var_2647_equation_0, values = (var_2489_cast_fp16, var_2406_cast_fp16))[name = tensor("op_2647_cast_fp16")]; + tensor var_2648_to_fp16 = const()[name = tensor("op_2648_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_133_cast_fp16 = mul(x = var_2647_cast_fp16, y = var_2648_to_fp16)[name = tensor("aw_133_cast_fp16")]; + tensor var_2651_equation_0 = const()[name = tensor("op_2651_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2651_cast_fp16 = einsum(equation = var_2651_equation_0, values = (var_2493_cast_fp16, var_2410_cast_fp16))[name = tensor("op_2651_cast_fp16")]; + tensor var_2652_to_fp16 = const()[name = tensor("op_2652_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_135_cast_fp16 = mul(x = var_2651_cast_fp16, y = var_2652_to_fp16)[name = tensor("aw_135_cast_fp16")]; + tensor var_2655_equation_0 = const()[name = tensor("op_2655_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2655_cast_fp16 = einsum(equation = var_2655_equation_0, values = (var_2497_cast_fp16, var_2414_cast_fp16))[name = tensor("op_2655_cast_fp16")]; + tensor var_2656_to_fp16 = const()[name = tensor("op_2656_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_137_cast_fp16 = mul(x = var_2655_cast_fp16, y = var_2656_to_fp16)[name = tensor("aw_137_cast_fp16")]; + tensor var_2659_equation_0 = const()[name = tensor("op_2659_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2659_cast_fp16 = einsum(equation = var_2659_equation_0, values = (var_2501_cast_fp16, var_2418_cast_fp16))[name = tensor("op_2659_cast_fp16")]; + tensor var_2660_to_fp16 = const()[name = tensor("op_2660_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_139_cast_fp16 = mul(x = var_2659_cast_fp16, y = var_2660_to_fp16)[name = tensor("aw_139_cast_fp16")]; + tensor var_2663_equation_0 = const()[name = tensor("op_2663_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2663_cast_fp16 = einsum(equation = var_2663_equation_0, values = (var_2505_cast_fp16, var_2422_cast_fp16))[name = tensor("op_2663_cast_fp16")]; + tensor var_2664_to_fp16 = const()[name = tensor("op_2664_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_141_cast_fp16 = mul(x = var_2663_cast_fp16, y = var_2664_to_fp16)[name = tensor("aw_141_cast_fp16")]; + tensor var_2667_equation_0 = const()[name = tensor("op_2667_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2667_cast_fp16 = einsum(equation = var_2667_equation_0, values = (var_2509_cast_fp16, var_2426_cast_fp16))[name = tensor("op_2667_cast_fp16")]; + tensor var_2668_to_fp16 = const()[name = tensor("op_2668_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_143_cast_fp16 = mul(x = var_2667_cast_fp16, y = var_2668_to_fp16)[name = tensor("aw_143_cast_fp16")]; + tensor var_2671_equation_0 = const()[name = tensor("op_2671_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2671_cast_fp16 = einsum(equation = var_2671_equation_0, values = (var_2513_cast_fp16, var_2430_cast_fp16))[name = tensor("op_2671_cast_fp16")]; + tensor var_2672_to_fp16 = const()[name = tensor("op_2672_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_145_cast_fp16 = mul(x = var_2671_cast_fp16, y = var_2672_to_fp16)[name = tensor("aw_145_cast_fp16")]; + tensor var_2675_equation_0 = const()[name = tensor("op_2675_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2675_cast_fp16 = einsum(equation = var_2675_equation_0, values = (var_2517_cast_fp16, var_2434_cast_fp16))[name = tensor("op_2675_cast_fp16")]; + tensor var_2676_to_fp16 = const()[name = tensor("op_2676_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_147_cast_fp16 = mul(x = var_2675_cast_fp16, y = var_2676_to_fp16)[name = tensor("aw_147_cast_fp16")]; + tensor var_2679_equation_0 = const()[name = tensor("op_2679_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2679_cast_fp16 = einsum(equation = var_2679_equation_0, values = (var_2521_cast_fp16, var_2438_cast_fp16))[name = tensor("op_2679_cast_fp16")]; + tensor var_2680_to_fp16 = const()[name = tensor("op_2680_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_149_cast_fp16 = mul(x = var_2679_cast_fp16, y = var_2680_to_fp16)[name = tensor("aw_149_cast_fp16")]; + tensor var_2683_equation_0 = const()[name = tensor("op_2683_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2683_cast_fp16 = einsum(equation = var_2683_equation_0, values = (var_2525_cast_fp16, var_2442_cast_fp16))[name = tensor("op_2683_cast_fp16")]; + tensor var_2684_to_fp16 = const()[name = tensor("op_2684_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_151_cast_fp16 = mul(x = var_2683_cast_fp16, y = var_2684_to_fp16)[name = tensor("aw_151_cast_fp16")]; + tensor var_2687_equation_0 = const()[name = tensor("op_2687_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2687_cast_fp16 = einsum(equation = var_2687_equation_0, values = (var_2529_cast_fp16, var_2446_cast_fp16))[name = tensor("op_2687_cast_fp16")]; + tensor var_2688_to_fp16 = const()[name = tensor("op_2688_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_153_cast_fp16 = mul(x = var_2687_cast_fp16, y = var_2688_to_fp16)[name = tensor("aw_153_cast_fp16")]; + tensor var_2691_equation_0 = const()[name = tensor("op_2691_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2691_cast_fp16 = einsum(equation = var_2691_equation_0, values = (var_2533_cast_fp16, var_2450_cast_fp16))[name = tensor("op_2691_cast_fp16")]; + tensor var_2692_to_fp16 = const()[name = tensor("op_2692_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_155_cast_fp16 = mul(x = var_2691_cast_fp16, y = var_2692_to_fp16)[name = tensor("aw_155_cast_fp16")]; + tensor var_2695_equation_0 = const()[name = tensor("op_2695_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2695_cast_fp16 = einsum(equation = var_2695_equation_0, values = (var_2537_cast_fp16, var_2454_cast_fp16))[name = tensor("op_2695_cast_fp16")]; + tensor var_2696_to_fp16 = const()[name = tensor("op_2696_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_157_cast_fp16 = mul(x = var_2695_cast_fp16, y = var_2696_to_fp16)[name = tensor("aw_157_cast_fp16")]; + tensor var_2699_equation_0 = const()[name = tensor("op_2699_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_2699_cast_fp16 = einsum(equation = var_2699_equation_0, values = (var_2541_cast_fp16, var_2458_cast_fp16))[name = tensor("op_2699_cast_fp16")]; + tensor var_2700_to_fp16 = const()[name = tensor("op_2700_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_159_cast_fp16 = mul(x = var_2699_cast_fp16, y = var_2700_to_fp16)[name = tensor("aw_159_cast_fp16")]; + tensor var_2702_cast_fp16 = softmax(axis = var_2254, x = aw_121_cast_fp16)[name = tensor("op_2702_cast_fp16")]; + tensor var_2703_cast_fp16 = softmax(axis = var_2254, x = aw_123_cast_fp16)[name = tensor("op_2703_cast_fp16")]; + tensor var_2704_cast_fp16 = softmax(axis = var_2254, x = aw_125_cast_fp16)[name = tensor("op_2704_cast_fp16")]; + tensor var_2705_cast_fp16 = softmax(axis = var_2254, x = aw_127_cast_fp16)[name = tensor("op_2705_cast_fp16")]; + tensor var_2706_cast_fp16 = softmax(axis = var_2254, x = aw_129_cast_fp16)[name = tensor("op_2706_cast_fp16")]; + tensor var_2707_cast_fp16 = softmax(axis = var_2254, x = aw_131_cast_fp16)[name = tensor("op_2707_cast_fp16")]; + tensor var_2708_cast_fp16 = softmax(axis = var_2254, x = aw_133_cast_fp16)[name = tensor("op_2708_cast_fp16")]; + tensor var_2709_cast_fp16 = softmax(axis = var_2254, x = aw_135_cast_fp16)[name = tensor("op_2709_cast_fp16")]; + tensor var_2710_cast_fp16 = softmax(axis = var_2254, x = aw_137_cast_fp16)[name = tensor("op_2710_cast_fp16")]; + tensor var_2711_cast_fp16 = softmax(axis = var_2254, x = aw_139_cast_fp16)[name = tensor("op_2711_cast_fp16")]; + tensor var_2712_cast_fp16 = softmax(axis = var_2254, x = aw_141_cast_fp16)[name = tensor("op_2712_cast_fp16")]; + tensor var_2713_cast_fp16 = softmax(axis = var_2254, x = aw_143_cast_fp16)[name = tensor("op_2713_cast_fp16")]; + tensor var_2714_cast_fp16 = softmax(axis = var_2254, x = aw_145_cast_fp16)[name = tensor("op_2714_cast_fp16")]; + tensor var_2715_cast_fp16 = softmax(axis = var_2254, x = aw_147_cast_fp16)[name = tensor("op_2715_cast_fp16")]; + tensor var_2716_cast_fp16 = softmax(axis = var_2254, x = aw_149_cast_fp16)[name = tensor("op_2716_cast_fp16")]; + tensor var_2717_cast_fp16 = softmax(axis = var_2254, x = aw_151_cast_fp16)[name = tensor("op_2717_cast_fp16")]; + tensor var_2718_cast_fp16 = softmax(axis = var_2254, x = aw_153_cast_fp16)[name = tensor("op_2718_cast_fp16")]; + tensor var_2719_cast_fp16 = softmax(axis = var_2254, x = aw_155_cast_fp16)[name = tensor("op_2719_cast_fp16")]; + tensor var_2720_cast_fp16 = softmax(axis = var_2254, x = aw_157_cast_fp16)[name = tensor("op_2720_cast_fp16")]; + tensor var_2721_cast_fp16 = softmax(axis = var_2254, x = aw_159_cast_fp16)[name = tensor("op_2721_cast_fp16")]; + tensor var_2723_equation_0 = const()[name = tensor("op_2723_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2723_cast_fp16 = einsum(equation = var_2723_equation_0, values = (var_2543_cast_fp16, var_2702_cast_fp16))[name = tensor("op_2723_cast_fp16")]; + tensor var_2725_equation_0 = const()[name = tensor("op_2725_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2725_cast_fp16 = einsum(equation = var_2725_equation_0, values = (var_2547_cast_fp16, var_2703_cast_fp16))[name = tensor("op_2725_cast_fp16")]; + tensor var_2727_equation_0 = const()[name = tensor("op_2727_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2727_cast_fp16 = einsum(equation = var_2727_equation_0, values = (var_2551_cast_fp16, var_2704_cast_fp16))[name = tensor("op_2727_cast_fp16")]; + tensor var_2729_equation_0 = const()[name = tensor("op_2729_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2729_cast_fp16 = einsum(equation = var_2729_equation_0, values = (var_2555_cast_fp16, var_2705_cast_fp16))[name = tensor("op_2729_cast_fp16")]; + tensor var_2731_equation_0 = const()[name = tensor("op_2731_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2731_cast_fp16 = einsum(equation = var_2731_equation_0, values = (var_2559_cast_fp16, var_2706_cast_fp16))[name = tensor("op_2731_cast_fp16")]; + tensor var_2733_equation_0 = const()[name = tensor("op_2733_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2733_cast_fp16 = einsum(equation = var_2733_equation_0, values = (var_2563_cast_fp16, var_2707_cast_fp16))[name = tensor("op_2733_cast_fp16")]; + tensor var_2735_equation_0 = const()[name = tensor("op_2735_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2735_cast_fp16 = einsum(equation = var_2735_equation_0, values = (var_2567_cast_fp16, var_2708_cast_fp16))[name = tensor("op_2735_cast_fp16")]; + tensor var_2737_equation_0 = const()[name = tensor("op_2737_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2737_cast_fp16 = einsum(equation = var_2737_equation_0, values = (var_2571_cast_fp16, var_2709_cast_fp16))[name = tensor("op_2737_cast_fp16")]; + tensor var_2739_equation_0 = const()[name = tensor("op_2739_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2739_cast_fp16 = einsum(equation = var_2739_equation_0, values = (var_2575_cast_fp16, var_2710_cast_fp16))[name = tensor("op_2739_cast_fp16")]; + tensor var_2741_equation_0 = const()[name = tensor("op_2741_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2741_cast_fp16 = einsum(equation = var_2741_equation_0, values = (var_2579_cast_fp16, var_2711_cast_fp16))[name = tensor("op_2741_cast_fp16")]; + tensor var_2743_equation_0 = const()[name = tensor("op_2743_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2743_cast_fp16 = einsum(equation = var_2743_equation_0, values = (var_2583_cast_fp16, var_2712_cast_fp16))[name = tensor("op_2743_cast_fp16")]; + tensor var_2745_equation_0 = const()[name = tensor("op_2745_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2745_cast_fp16 = einsum(equation = var_2745_equation_0, values = (var_2587_cast_fp16, var_2713_cast_fp16))[name = tensor("op_2745_cast_fp16")]; + tensor var_2747_equation_0 = const()[name = tensor("op_2747_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2747_cast_fp16 = einsum(equation = var_2747_equation_0, values = (var_2591_cast_fp16, var_2714_cast_fp16))[name = tensor("op_2747_cast_fp16")]; + tensor var_2749_equation_0 = const()[name = tensor("op_2749_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2749_cast_fp16 = einsum(equation = var_2749_equation_0, values = (var_2595_cast_fp16, var_2715_cast_fp16))[name = tensor("op_2749_cast_fp16")]; + tensor var_2751_equation_0 = const()[name = tensor("op_2751_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2751_cast_fp16 = einsum(equation = var_2751_equation_0, values = (var_2599_cast_fp16, var_2716_cast_fp16))[name = tensor("op_2751_cast_fp16")]; + tensor var_2753_equation_0 = const()[name = tensor("op_2753_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2753_cast_fp16 = einsum(equation = var_2753_equation_0, values = (var_2603_cast_fp16, var_2717_cast_fp16))[name = tensor("op_2753_cast_fp16")]; + tensor var_2755_equation_0 = const()[name = tensor("op_2755_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2755_cast_fp16 = einsum(equation = var_2755_equation_0, values = (var_2607_cast_fp16, var_2718_cast_fp16))[name = tensor("op_2755_cast_fp16")]; + tensor var_2757_equation_0 = const()[name = tensor("op_2757_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2757_cast_fp16 = einsum(equation = var_2757_equation_0, values = (var_2611_cast_fp16, var_2719_cast_fp16))[name = tensor("op_2757_cast_fp16")]; + tensor var_2759_equation_0 = const()[name = tensor("op_2759_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2759_cast_fp16 = einsum(equation = var_2759_equation_0, values = (var_2615_cast_fp16, var_2720_cast_fp16))[name = tensor("op_2759_cast_fp16")]; + tensor var_2761_equation_0 = const()[name = tensor("op_2761_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_2761_cast_fp16 = einsum(equation = var_2761_equation_0, values = (var_2619_cast_fp16, var_2721_cast_fp16))[name = tensor("op_2761_cast_fp16")]; + tensor input_133_interleave_0 = const()[name = tensor("input_133_interleave_0"), val = tensor(false)]; + tensor input_133_cast_fp16 = concat(axis = var_2254, interleave = input_133_interleave_0, values = (var_2723_cast_fp16, var_2725_cast_fp16, var_2727_cast_fp16, var_2729_cast_fp16, var_2731_cast_fp16, var_2733_cast_fp16, var_2735_cast_fp16, var_2737_cast_fp16, var_2739_cast_fp16, var_2741_cast_fp16, var_2743_cast_fp16, var_2745_cast_fp16, var_2747_cast_fp16, var_2749_cast_fp16, var_2751_cast_fp16, var_2753_cast_fp16, var_2755_cast_fp16, var_2757_cast_fp16, var_2759_cast_fp16, var_2761_cast_fp16))[name = tensor("input_133_cast_fp16")]; + tensor var_2767 = const()[name = tensor("op_2767"), val = tensor([1, 1])]; + tensor var_2769 = const()[name = tensor("op_2769"), val = tensor([1, 1])]; + tensor var_2771_pad_type_0 = const()[name = tensor("op_2771_pad_type_0"), val = tensor("custom")]; + tensor var_2771_pad_0 = const()[name = tensor("op_2771_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163088000)))]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166364864)))]; + tensor var_2771_cast_fp16 = conv(bias = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_2769, groups = var_2254, pad = var_2771_pad_0, pad_type = var_2771_pad_type_0, strides = var_2767, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_133_cast_fp16)[name = tensor("op_2771_cast_fp16")]; + tensor inputs_27_cast_fp16 = add(x = var_2771_cast_fp16, y = inputs_25_cast_fp16)[name = tensor("inputs_27_cast_fp16")]; + tensor var_2775 = const()[name = tensor("op_2775"), val = tensor([1])]; + tensor channels_mean_27_cast_fp16 = reduce_mean(axes = var_2775, keep_dims = var_2249, x = inputs_27_cast_fp16)[name = tensor("channels_mean_27_cast_fp16")]; + tensor zero_mean_27_cast_fp16 = sub(x = inputs_27_cast_fp16, y = channels_mean_27_cast_fp16)[name = tensor("zero_mean_27_cast_fp16")]; + tensor zero_mean_sq_27_cast_fp16 = mul(x = zero_mean_27_cast_fp16, y = zero_mean_27_cast_fp16)[name = tensor("zero_mean_sq_27_cast_fp16")]; + tensor var_2779 = const()[name = tensor("op_2779"), val = tensor([1])]; + tensor var_2780_cast_fp16 = reduce_mean(axes = var_2779, keep_dims = var_2249, x = zero_mean_sq_27_cast_fp16)[name = tensor("op_2780_cast_fp16")]; + tensor var_2781_to_fp16 = const()[name = tensor("op_2781_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2782_cast_fp16 = add(x = var_2780_cast_fp16, y = var_2781_to_fp16)[name = tensor("op_2782_cast_fp16")]; + tensor denom_27_epsilon_0_to_fp16 = const()[name = tensor("denom_27_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_27_cast_fp16 = rsqrt(epsilon = denom_27_epsilon_0_to_fp16, x = var_2782_cast_fp16)[name = tensor("denom_27_cast_fp16")]; + tensor out_27_cast_fp16 = mul(x = zero_mean_27_cast_fp16, y = denom_27_cast_fp16)[name = tensor("out_27_cast_fp16")]; + tensor var_2786_to_fp16 = const()[name = tensor("op_2786_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166367488)))]; + tensor var_2787_cast_fp16 = add(x = out_27_cast_fp16, y = var_2786_to_fp16)[name = tensor("op_2787_cast_fp16")]; + tensor var_2789_to_fp16 = const()[name = tensor("op_2789_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166370112)))]; + tensor hidden_states_83_cast_fp16 = mul(x = var_2787_cast_fp16, y = var_2789_to_fp16)[name = tensor("hidden_states_83_cast_fp16")]; + tensor var_2796 = const()[name = tensor("op_2796"), val = tensor([1, 1])]; + tensor var_2798 = const()[name = tensor("op_2798"), val = tensor([1, 1])]; + tensor q_19_pad_type_0 = const()[name = tensor("q_19_pad_type_0"), val = tensor("custom")]; + tensor q_19_pad_0 = const()[name = tensor("q_19_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166372736)))]; + tensor q_19_cast_fp16 = conv(dilations = var_2798, groups = var_2254, pad = q_19_pad_0, pad_type = q_19_pad_type_0, strides = var_2796, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_83_cast_fp16)[name = tensor("q_19_cast_fp16")]; + tensor var_2802 = const()[name = tensor("op_2802"), val = tensor([1, 1])]; + tensor var_2804 = const()[name = tensor("op_2804"), val = tensor([1, 1])]; + tensor k_37_pad_type_0 = const()[name = tensor("k_37_pad_type_0"), val = tensor("custom")]; + tensor k_37_pad_0 = const()[name = tensor("k_37_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169649600)))]; + tensor k_37_cast_fp16 = conv(dilations = var_2804, groups = var_2254, pad = k_37_pad_0, pad_type = k_37_pad_type_0, strides = var_2802, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_37_cast_fp16")]; + tensor var_2808 = const()[name = tensor("op_2808"), val = tensor([1, 1])]; + tensor var_2810 = const()[name = tensor("op_2810"), val = tensor([1, 1])]; + tensor v_19_pad_type_0 = const()[name = tensor("v_19_pad_type_0"), val = tensor("custom")]; + tensor v_19_pad_0 = const()[name = tensor("v_19_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172271104)))]; + tensor v_19_cast_fp16 = conv(dilations = var_2810, groups = var_2254, pad = v_19_pad_0, pad_type = v_19_pad_type_0, strides = var_2808, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_19_cast_fp16")]; + tensor var_2814_begin_0 = const()[name = tensor("op_2814_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_2814_end_0 = const()[name = tensor("op_2814_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_2814_end_mask_0 = const()[name = tensor("op_2814_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2814_cast_fp16 = slice_by_index(begin = var_2814_begin_0, end = var_2814_end_0, end_mask = var_2814_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2814_cast_fp16")]; + tensor var_2818_begin_0 = const()[name = tensor("op_2818_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_2818_end_0 = const()[name = tensor("op_2818_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_2818_end_mask_0 = const()[name = tensor("op_2818_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2818_cast_fp16 = slice_by_index(begin = var_2818_begin_0, end = var_2818_end_0, end_mask = var_2818_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2818_cast_fp16")]; + tensor var_2822_begin_0 = const()[name = tensor("op_2822_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_2822_end_0 = const()[name = tensor("op_2822_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_2822_end_mask_0 = const()[name = tensor("op_2822_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2822_cast_fp16 = slice_by_index(begin = var_2822_begin_0, end = var_2822_end_0, end_mask = var_2822_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2822_cast_fp16")]; + tensor var_2826_begin_0 = const()[name = tensor("op_2826_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_2826_end_0 = const()[name = tensor("op_2826_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_2826_end_mask_0 = const()[name = tensor("op_2826_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2826_cast_fp16 = slice_by_index(begin = var_2826_begin_0, end = var_2826_end_0, end_mask = var_2826_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2826_cast_fp16")]; + tensor var_2830_begin_0 = const()[name = tensor("op_2830_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_2830_end_0 = const()[name = tensor("op_2830_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_2830_end_mask_0 = const()[name = tensor("op_2830_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2830_cast_fp16 = slice_by_index(begin = var_2830_begin_0, end = var_2830_end_0, end_mask = var_2830_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2830_cast_fp16")]; + tensor var_2834_begin_0 = const()[name = tensor("op_2834_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_2834_end_0 = const()[name = tensor("op_2834_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_2834_end_mask_0 = const()[name = tensor("op_2834_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2834_cast_fp16 = slice_by_index(begin = var_2834_begin_0, end = var_2834_end_0, end_mask = var_2834_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2834_cast_fp16")]; + tensor var_2838_begin_0 = const()[name = tensor("op_2838_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_2838_end_0 = const()[name = tensor("op_2838_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_2838_end_mask_0 = const()[name = tensor("op_2838_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2838_cast_fp16 = slice_by_index(begin = var_2838_begin_0, end = var_2838_end_0, end_mask = var_2838_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2838_cast_fp16")]; + tensor var_2842_begin_0 = const()[name = tensor("op_2842_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_2842_end_0 = const()[name = tensor("op_2842_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_2842_end_mask_0 = const()[name = tensor("op_2842_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2842_cast_fp16 = slice_by_index(begin = var_2842_begin_0, end = var_2842_end_0, end_mask = var_2842_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2842_cast_fp16")]; + tensor var_2846_begin_0 = const()[name = tensor("op_2846_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_2846_end_0 = const()[name = tensor("op_2846_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_2846_end_mask_0 = const()[name = tensor("op_2846_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2846_cast_fp16 = slice_by_index(begin = var_2846_begin_0, end = var_2846_end_0, end_mask = var_2846_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2846_cast_fp16")]; + tensor var_2850_begin_0 = const()[name = tensor("op_2850_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_2850_end_0 = const()[name = tensor("op_2850_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_2850_end_mask_0 = const()[name = tensor("op_2850_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2850_cast_fp16 = slice_by_index(begin = var_2850_begin_0, end = var_2850_end_0, end_mask = var_2850_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2850_cast_fp16")]; + tensor var_2854_begin_0 = const()[name = tensor("op_2854_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_2854_end_0 = const()[name = tensor("op_2854_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_2854_end_mask_0 = const()[name = tensor("op_2854_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2854_cast_fp16 = slice_by_index(begin = var_2854_begin_0, end = var_2854_end_0, end_mask = var_2854_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2854_cast_fp16")]; + tensor var_2858_begin_0 = const()[name = tensor("op_2858_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_2858_end_0 = const()[name = tensor("op_2858_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_2858_end_mask_0 = const()[name = tensor("op_2858_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2858_cast_fp16 = slice_by_index(begin = var_2858_begin_0, end = var_2858_end_0, end_mask = var_2858_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2858_cast_fp16")]; + tensor var_2862_begin_0 = const()[name = tensor("op_2862_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_2862_end_0 = const()[name = tensor("op_2862_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_2862_end_mask_0 = const()[name = tensor("op_2862_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2862_cast_fp16 = slice_by_index(begin = var_2862_begin_0, end = var_2862_end_0, end_mask = var_2862_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2862_cast_fp16")]; + tensor var_2866_begin_0 = const()[name = tensor("op_2866_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_2866_end_0 = const()[name = tensor("op_2866_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_2866_end_mask_0 = const()[name = tensor("op_2866_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2866_cast_fp16 = slice_by_index(begin = var_2866_begin_0, end = var_2866_end_0, end_mask = var_2866_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2866_cast_fp16")]; + tensor var_2870_begin_0 = const()[name = tensor("op_2870_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_2870_end_0 = const()[name = tensor("op_2870_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_2870_end_mask_0 = const()[name = tensor("op_2870_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2870_cast_fp16 = slice_by_index(begin = var_2870_begin_0, end = var_2870_end_0, end_mask = var_2870_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2870_cast_fp16")]; + tensor var_2874_begin_0 = const()[name = tensor("op_2874_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_2874_end_0 = const()[name = tensor("op_2874_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_2874_end_mask_0 = const()[name = tensor("op_2874_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2874_cast_fp16 = slice_by_index(begin = var_2874_begin_0, end = var_2874_end_0, end_mask = var_2874_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2874_cast_fp16")]; + tensor var_2878_begin_0 = const()[name = tensor("op_2878_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_2878_end_0 = const()[name = tensor("op_2878_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_2878_end_mask_0 = const()[name = tensor("op_2878_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2878_cast_fp16 = slice_by_index(begin = var_2878_begin_0, end = var_2878_end_0, end_mask = var_2878_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2878_cast_fp16")]; + tensor var_2882_begin_0 = const()[name = tensor("op_2882_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_2882_end_0 = const()[name = tensor("op_2882_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_2882_end_mask_0 = const()[name = tensor("op_2882_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2882_cast_fp16 = slice_by_index(begin = var_2882_begin_0, end = var_2882_end_0, end_mask = var_2882_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2882_cast_fp16")]; + tensor var_2886_begin_0 = const()[name = tensor("op_2886_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_2886_end_0 = const()[name = tensor("op_2886_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_2886_end_mask_0 = const()[name = tensor("op_2886_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2886_cast_fp16 = slice_by_index(begin = var_2886_begin_0, end = var_2886_end_0, end_mask = var_2886_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2886_cast_fp16")]; + tensor var_2890_begin_0 = const()[name = tensor("op_2890_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_2890_end_0 = const()[name = tensor("op_2890_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_2890_end_mask_0 = const()[name = tensor("op_2890_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2890_cast_fp16 = slice_by_index(begin = var_2890_begin_0, end = var_2890_end_0, end_mask = var_2890_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2890_cast_fp16")]; + tensor k_39_perm_0 = const()[name = tensor("k_39_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_2897_begin_0 = const()[name = tensor("op_2897_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_2897_end_0 = const()[name = tensor("op_2897_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_2897_end_mask_0 = const()[name = tensor("op_2897_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_22 = transpose(perm = k_39_perm_0, x = k_37_cast_fp16)[name = tensor("transpose_22")]; + tensor var_2897_cast_fp16 = slice_by_index(begin = var_2897_begin_0, end = var_2897_end_0, end_mask = var_2897_end_mask_0, x = transpose_22)[name = tensor("op_2897_cast_fp16")]; + tensor var_2901_begin_0 = const()[name = tensor("op_2901_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_2901_end_0 = const()[name = tensor("op_2901_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_2901_end_mask_0 = const()[name = tensor("op_2901_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2901_cast_fp16 = slice_by_index(begin = var_2901_begin_0, end = var_2901_end_0, end_mask = var_2901_end_mask_0, x = transpose_22)[name = tensor("op_2901_cast_fp16")]; + tensor var_2905_begin_0 = const()[name = tensor("op_2905_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_2905_end_0 = const()[name = tensor("op_2905_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_2905_end_mask_0 = const()[name = tensor("op_2905_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2905_cast_fp16 = slice_by_index(begin = var_2905_begin_0, end = var_2905_end_0, end_mask = var_2905_end_mask_0, x = transpose_22)[name = tensor("op_2905_cast_fp16")]; + tensor var_2909_begin_0 = const()[name = tensor("op_2909_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_2909_end_0 = const()[name = tensor("op_2909_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_2909_end_mask_0 = const()[name = tensor("op_2909_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2909_cast_fp16 = slice_by_index(begin = var_2909_begin_0, end = var_2909_end_0, end_mask = var_2909_end_mask_0, x = transpose_22)[name = tensor("op_2909_cast_fp16")]; + tensor var_2913_begin_0 = const()[name = tensor("op_2913_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_2913_end_0 = const()[name = tensor("op_2913_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_2913_end_mask_0 = const()[name = tensor("op_2913_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2913_cast_fp16 = slice_by_index(begin = var_2913_begin_0, end = var_2913_end_0, end_mask = var_2913_end_mask_0, x = transpose_22)[name = tensor("op_2913_cast_fp16")]; + tensor var_2917_begin_0 = const()[name = tensor("op_2917_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_2917_end_0 = const()[name = tensor("op_2917_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_2917_end_mask_0 = const()[name = tensor("op_2917_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2917_cast_fp16 = slice_by_index(begin = var_2917_begin_0, end = var_2917_end_0, end_mask = var_2917_end_mask_0, x = transpose_22)[name = tensor("op_2917_cast_fp16")]; + tensor var_2921_begin_0 = const()[name = tensor("op_2921_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_2921_end_0 = const()[name = tensor("op_2921_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_2921_end_mask_0 = const()[name = tensor("op_2921_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2921_cast_fp16 = slice_by_index(begin = var_2921_begin_0, end = var_2921_end_0, end_mask = var_2921_end_mask_0, x = transpose_22)[name = tensor("op_2921_cast_fp16")]; + tensor var_2925_begin_0 = const()[name = tensor("op_2925_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_2925_end_0 = const()[name = tensor("op_2925_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_2925_end_mask_0 = const()[name = tensor("op_2925_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2925_cast_fp16 = slice_by_index(begin = var_2925_begin_0, end = var_2925_end_0, end_mask = var_2925_end_mask_0, x = transpose_22)[name = tensor("op_2925_cast_fp16")]; + tensor var_2929_begin_0 = const()[name = tensor("op_2929_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_2929_end_0 = const()[name = tensor("op_2929_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_2929_end_mask_0 = const()[name = tensor("op_2929_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2929_cast_fp16 = slice_by_index(begin = var_2929_begin_0, end = var_2929_end_0, end_mask = var_2929_end_mask_0, x = transpose_22)[name = tensor("op_2929_cast_fp16")]; + tensor var_2933_begin_0 = const()[name = tensor("op_2933_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_2933_end_0 = const()[name = tensor("op_2933_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_2933_end_mask_0 = const()[name = tensor("op_2933_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2933_cast_fp16 = slice_by_index(begin = var_2933_begin_0, end = var_2933_end_0, end_mask = var_2933_end_mask_0, x = transpose_22)[name = tensor("op_2933_cast_fp16")]; + tensor var_2937_begin_0 = const()[name = tensor("op_2937_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_2937_end_0 = const()[name = tensor("op_2937_end_0"), val = tensor([2, 77, 1, 704])]; + tensor var_2937_end_mask_0 = const()[name = tensor("op_2937_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2937_cast_fp16 = slice_by_index(begin = var_2937_begin_0, end = var_2937_end_0, end_mask = var_2937_end_mask_0, x = transpose_22)[name = tensor("op_2937_cast_fp16")]; + tensor var_2941_begin_0 = const()[name = tensor("op_2941_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_2941_end_0 = const()[name = tensor("op_2941_end_0"), val = tensor([2, 77, 1, 768])]; + tensor var_2941_end_mask_0 = const()[name = tensor("op_2941_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2941_cast_fp16 = slice_by_index(begin = var_2941_begin_0, end = var_2941_end_0, end_mask = var_2941_end_mask_0, x = transpose_22)[name = tensor("op_2941_cast_fp16")]; + tensor var_2945_begin_0 = const()[name = tensor("op_2945_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_2945_end_0 = const()[name = tensor("op_2945_end_0"), val = tensor([2, 77, 1, 832])]; + tensor var_2945_end_mask_0 = const()[name = tensor("op_2945_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2945_cast_fp16 = slice_by_index(begin = var_2945_begin_0, end = var_2945_end_0, end_mask = var_2945_end_mask_0, x = transpose_22)[name = tensor("op_2945_cast_fp16")]; + tensor var_2949_begin_0 = const()[name = tensor("op_2949_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_2949_end_0 = const()[name = tensor("op_2949_end_0"), val = tensor([2, 77, 1, 896])]; + tensor var_2949_end_mask_0 = const()[name = tensor("op_2949_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2949_cast_fp16 = slice_by_index(begin = var_2949_begin_0, end = var_2949_end_0, end_mask = var_2949_end_mask_0, x = transpose_22)[name = tensor("op_2949_cast_fp16")]; + tensor var_2953_begin_0 = const()[name = tensor("op_2953_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_2953_end_0 = const()[name = tensor("op_2953_end_0"), val = tensor([2, 77, 1, 960])]; + tensor var_2953_end_mask_0 = const()[name = tensor("op_2953_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2953_cast_fp16 = slice_by_index(begin = var_2953_begin_0, end = var_2953_end_0, end_mask = var_2953_end_mask_0, x = transpose_22)[name = tensor("op_2953_cast_fp16")]; + tensor var_2957_begin_0 = const()[name = tensor("op_2957_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_2957_end_0 = const()[name = tensor("op_2957_end_0"), val = tensor([2, 77, 1, 1024])]; + tensor var_2957_end_mask_0 = const()[name = tensor("op_2957_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2957_cast_fp16 = slice_by_index(begin = var_2957_begin_0, end = var_2957_end_0, end_mask = var_2957_end_mask_0, x = transpose_22)[name = tensor("op_2957_cast_fp16")]; + tensor var_2961_begin_0 = const()[name = tensor("op_2961_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_2961_end_0 = const()[name = tensor("op_2961_end_0"), val = tensor([2, 77, 1, 1088])]; + tensor var_2961_end_mask_0 = const()[name = tensor("op_2961_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2961_cast_fp16 = slice_by_index(begin = var_2961_begin_0, end = var_2961_end_0, end_mask = var_2961_end_mask_0, x = transpose_22)[name = tensor("op_2961_cast_fp16")]; + tensor var_2965_begin_0 = const()[name = tensor("op_2965_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_2965_end_0 = const()[name = tensor("op_2965_end_0"), val = tensor([2, 77, 1, 1152])]; + tensor var_2965_end_mask_0 = const()[name = tensor("op_2965_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2965_cast_fp16 = slice_by_index(begin = var_2965_begin_0, end = var_2965_end_0, end_mask = var_2965_end_mask_0, x = transpose_22)[name = tensor("op_2965_cast_fp16")]; + tensor var_2969_begin_0 = const()[name = tensor("op_2969_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_2969_end_0 = const()[name = tensor("op_2969_end_0"), val = tensor([2, 77, 1, 1216])]; + tensor var_2969_end_mask_0 = const()[name = tensor("op_2969_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2969_cast_fp16 = slice_by_index(begin = var_2969_begin_0, end = var_2969_end_0, end_mask = var_2969_end_mask_0, x = transpose_22)[name = tensor("op_2969_cast_fp16")]; + tensor var_2973_begin_0 = const()[name = tensor("op_2973_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_2973_end_0 = const()[name = tensor("op_2973_end_0"), val = tensor([2, 77, 1, 1280])]; + tensor var_2973_end_mask_0 = const()[name = tensor("op_2973_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_2973_cast_fp16 = slice_by_index(begin = var_2973_begin_0, end = var_2973_end_0, end_mask = var_2973_end_mask_0, x = transpose_22)[name = tensor("op_2973_cast_fp16")]; + tensor var_2975_begin_0 = const()[name = tensor("op_2975_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_2975_end_0 = const()[name = tensor("op_2975_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_2975_end_mask_0 = const()[name = tensor("op_2975_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2975_cast_fp16 = slice_by_index(begin = var_2975_begin_0, end = var_2975_end_0, end_mask = var_2975_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2975_cast_fp16")]; + tensor var_2979_begin_0 = const()[name = tensor("op_2979_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_2979_end_0 = const()[name = tensor("op_2979_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_2979_end_mask_0 = const()[name = tensor("op_2979_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2979_cast_fp16 = slice_by_index(begin = var_2979_begin_0, end = var_2979_end_0, end_mask = var_2979_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2979_cast_fp16")]; + tensor var_2983_begin_0 = const()[name = tensor("op_2983_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_2983_end_0 = const()[name = tensor("op_2983_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_2983_end_mask_0 = const()[name = tensor("op_2983_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2983_cast_fp16 = slice_by_index(begin = var_2983_begin_0, end = var_2983_end_0, end_mask = var_2983_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2983_cast_fp16")]; + tensor var_2987_begin_0 = const()[name = tensor("op_2987_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_2987_end_0 = const()[name = tensor("op_2987_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_2987_end_mask_0 = const()[name = tensor("op_2987_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2987_cast_fp16 = slice_by_index(begin = var_2987_begin_0, end = var_2987_end_0, end_mask = var_2987_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2987_cast_fp16")]; + tensor var_2991_begin_0 = const()[name = tensor("op_2991_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_2991_end_0 = const()[name = tensor("op_2991_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_2991_end_mask_0 = const()[name = tensor("op_2991_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2991_cast_fp16 = slice_by_index(begin = var_2991_begin_0, end = var_2991_end_0, end_mask = var_2991_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2991_cast_fp16")]; + tensor var_2995_begin_0 = const()[name = tensor("op_2995_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_2995_end_0 = const()[name = tensor("op_2995_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_2995_end_mask_0 = const()[name = tensor("op_2995_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2995_cast_fp16 = slice_by_index(begin = var_2995_begin_0, end = var_2995_end_0, end_mask = var_2995_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2995_cast_fp16")]; + tensor var_2999_begin_0 = const()[name = tensor("op_2999_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_2999_end_0 = const()[name = tensor("op_2999_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_2999_end_mask_0 = const()[name = tensor("op_2999_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_2999_cast_fp16 = slice_by_index(begin = var_2999_begin_0, end = var_2999_end_0, end_mask = var_2999_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2999_cast_fp16")]; + tensor var_3003_begin_0 = const()[name = tensor("op_3003_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_3003_end_0 = const()[name = tensor("op_3003_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_3003_end_mask_0 = const()[name = tensor("op_3003_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3003_cast_fp16 = slice_by_index(begin = var_3003_begin_0, end = var_3003_end_0, end_mask = var_3003_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3003_cast_fp16")]; + tensor var_3007_begin_0 = const()[name = tensor("op_3007_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_3007_end_0 = const()[name = tensor("op_3007_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_3007_end_mask_0 = const()[name = tensor("op_3007_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3007_cast_fp16 = slice_by_index(begin = var_3007_begin_0, end = var_3007_end_0, end_mask = var_3007_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3007_cast_fp16")]; + tensor var_3011_begin_0 = const()[name = tensor("op_3011_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_3011_end_0 = const()[name = tensor("op_3011_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_3011_end_mask_0 = const()[name = tensor("op_3011_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3011_cast_fp16 = slice_by_index(begin = var_3011_begin_0, end = var_3011_end_0, end_mask = var_3011_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3011_cast_fp16")]; + tensor var_3015_begin_0 = const()[name = tensor("op_3015_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_3015_end_0 = const()[name = tensor("op_3015_end_0"), val = tensor([2, 704, 1, 77])]; + tensor var_3015_end_mask_0 = const()[name = tensor("op_3015_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3015_cast_fp16 = slice_by_index(begin = var_3015_begin_0, end = var_3015_end_0, end_mask = var_3015_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3015_cast_fp16")]; + tensor var_3019_begin_0 = const()[name = tensor("op_3019_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_3019_end_0 = const()[name = tensor("op_3019_end_0"), val = tensor([2, 768, 1, 77])]; + tensor var_3019_end_mask_0 = const()[name = tensor("op_3019_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3019_cast_fp16 = slice_by_index(begin = var_3019_begin_0, end = var_3019_end_0, end_mask = var_3019_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3019_cast_fp16")]; + tensor var_3023_begin_0 = const()[name = tensor("op_3023_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_3023_end_0 = const()[name = tensor("op_3023_end_0"), val = tensor([2, 832, 1, 77])]; + tensor var_3023_end_mask_0 = const()[name = tensor("op_3023_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3023_cast_fp16 = slice_by_index(begin = var_3023_begin_0, end = var_3023_end_0, end_mask = var_3023_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3023_cast_fp16")]; + tensor var_3027_begin_0 = const()[name = tensor("op_3027_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_3027_end_0 = const()[name = tensor("op_3027_end_0"), val = tensor([2, 896, 1, 77])]; + tensor var_3027_end_mask_0 = const()[name = tensor("op_3027_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3027_cast_fp16 = slice_by_index(begin = var_3027_begin_0, end = var_3027_end_0, end_mask = var_3027_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3027_cast_fp16")]; + tensor var_3031_begin_0 = const()[name = tensor("op_3031_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_3031_end_0 = const()[name = tensor("op_3031_end_0"), val = tensor([2, 960, 1, 77])]; + tensor var_3031_end_mask_0 = const()[name = tensor("op_3031_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3031_cast_fp16 = slice_by_index(begin = var_3031_begin_0, end = var_3031_end_0, end_mask = var_3031_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3031_cast_fp16")]; + tensor var_3035_begin_0 = const()[name = tensor("op_3035_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_3035_end_0 = const()[name = tensor("op_3035_end_0"), val = tensor([2, 1024, 1, 77])]; + tensor var_3035_end_mask_0 = const()[name = tensor("op_3035_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3035_cast_fp16 = slice_by_index(begin = var_3035_begin_0, end = var_3035_end_0, end_mask = var_3035_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3035_cast_fp16")]; + tensor var_3039_begin_0 = const()[name = tensor("op_3039_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_3039_end_0 = const()[name = tensor("op_3039_end_0"), val = tensor([2, 1088, 1, 77])]; + tensor var_3039_end_mask_0 = const()[name = tensor("op_3039_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3039_cast_fp16 = slice_by_index(begin = var_3039_begin_0, end = var_3039_end_0, end_mask = var_3039_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3039_cast_fp16")]; + tensor var_3043_begin_0 = const()[name = tensor("op_3043_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_3043_end_0 = const()[name = tensor("op_3043_end_0"), val = tensor([2, 1152, 1, 77])]; + tensor var_3043_end_mask_0 = const()[name = tensor("op_3043_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3043_cast_fp16 = slice_by_index(begin = var_3043_begin_0, end = var_3043_end_0, end_mask = var_3043_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3043_cast_fp16")]; + tensor var_3047_begin_0 = const()[name = tensor("op_3047_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_3047_end_0 = const()[name = tensor("op_3047_end_0"), val = tensor([2, 1216, 1, 77])]; + tensor var_3047_end_mask_0 = const()[name = tensor("op_3047_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3047_cast_fp16 = slice_by_index(begin = var_3047_begin_0, end = var_3047_end_0, end_mask = var_3047_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3047_cast_fp16")]; + tensor var_3051_begin_0 = const()[name = tensor("op_3051_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_3051_end_0 = const()[name = tensor("op_3051_end_0"), val = tensor([2, 1280, 1, 77])]; + tensor var_3051_end_mask_0 = const()[name = tensor("op_3051_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3051_cast_fp16 = slice_by_index(begin = var_3051_begin_0, end = var_3051_end_0, end_mask = var_3051_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3051_cast_fp16")]; + tensor var_3055_equation_0 = const()[name = tensor("op_3055_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3055_cast_fp16 = einsum(equation = var_3055_equation_0, values = (var_2897_cast_fp16, var_2814_cast_fp16))[name = tensor("op_3055_cast_fp16")]; + tensor var_3056_to_fp16 = const()[name = tensor("op_3056_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_161_cast_fp16 = mul(x = var_3055_cast_fp16, y = var_3056_to_fp16)[name = tensor("aw_161_cast_fp16")]; + tensor var_3059_equation_0 = const()[name = tensor("op_3059_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3059_cast_fp16 = einsum(equation = var_3059_equation_0, values = (var_2901_cast_fp16, var_2818_cast_fp16))[name = tensor("op_3059_cast_fp16")]; + tensor var_3060_to_fp16 = const()[name = tensor("op_3060_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_163_cast_fp16 = mul(x = var_3059_cast_fp16, y = var_3060_to_fp16)[name = tensor("aw_163_cast_fp16")]; + tensor var_3063_equation_0 = const()[name = tensor("op_3063_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3063_cast_fp16 = einsum(equation = var_3063_equation_0, values = (var_2905_cast_fp16, var_2822_cast_fp16))[name = tensor("op_3063_cast_fp16")]; + tensor var_3064_to_fp16 = const()[name = tensor("op_3064_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_165_cast_fp16 = mul(x = var_3063_cast_fp16, y = var_3064_to_fp16)[name = tensor("aw_165_cast_fp16")]; + tensor var_3067_equation_0 = const()[name = tensor("op_3067_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3067_cast_fp16 = einsum(equation = var_3067_equation_0, values = (var_2909_cast_fp16, var_2826_cast_fp16))[name = tensor("op_3067_cast_fp16")]; + tensor var_3068_to_fp16 = const()[name = tensor("op_3068_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_167_cast_fp16 = mul(x = var_3067_cast_fp16, y = var_3068_to_fp16)[name = tensor("aw_167_cast_fp16")]; + tensor var_3071_equation_0 = const()[name = tensor("op_3071_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3071_cast_fp16 = einsum(equation = var_3071_equation_0, values = (var_2913_cast_fp16, var_2830_cast_fp16))[name = tensor("op_3071_cast_fp16")]; + tensor var_3072_to_fp16 = const()[name = tensor("op_3072_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_169_cast_fp16 = mul(x = var_3071_cast_fp16, y = var_3072_to_fp16)[name = tensor("aw_169_cast_fp16")]; + tensor var_3075_equation_0 = const()[name = tensor("op_3075_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3075_cast_fp16 = einsum(equation = var_3075_equation_0, values = (var_2917_cast_fp16, var_2834_cast_fp16))[name = tensor("op_3075_cast_fp16")]; + tensor var_3076_to_fp16 = const()[name = tensor("op_3076_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_171_cast_fp16 = mul(x = var_3075_cast_fp16, y = var_3076_to_fp16)[name = tensor("aw_171_cast_fp16")]; + tensor var_3079_equation_0 = const()[name = tensor("op_3079_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3079_cast_fp16 = einsum(equation = var_3079_equation_0, values = (var_2921_cast_fp16, var_2838_cast_fp16))[name = tensor("op_3079_cast_fp16")]; + tensor var_3080_to_fp16 = const()[name = tensor("op_3080_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_173_cast_fp16 = mul(x = var_3079_cast_fp16, y = var_3080_to_fp16)[name = tensor("aw_173_cast_fp16")]; + tensor var_3083_equation_0 = const()[name = tensor("op_3083_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3083_cast_fp16 = einsum(equation = var_3083_equation_0, values = (var_2925_cast_fp16, var_2842_cast_fp16))[name = tensor("op_3083_cast_fp16")]; + tensor var_3084_to_fp16 = const()[name = tensor("op_3084_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_175_cast_fp16 = mul(x = var_3083_cast_fp16, y = var_3084_to_fp16)[name = tensor("aw_175_cast_fp16")]; + tensor var_3087_equation_0 = const()[name = tensor("op_3087_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3087_cast_fp16 = einsum(equation = var_3087_equation_0, values = (var_2929_cast_fp16, var_2846_cast_fp16))[name = tensor("op_3087_cast_fp16")]; + tensor var_3088_to_fp16 = const()[name = tensor("op_3088_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_177_cast_fp16 = mul(x = var_3087_cast_fp16, y = var_3088_to_fp16)[name = tensor("aw_177_cast_fp16")]; + tensor var_3091_equation_0 = const()[name = tensor("op_3091_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3091_cast_fp16 = einsum(equation = var_3091_equation_0, values = (var_2933_cast_fp16, var_2850_cast_fp16))[name = tensor("op_3091_cast_fp16")]; + tensor var_3092_to_fp16 = const()[name = tensor("op_3092_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_179_cast_fp16 = mul(x = var_3091_cast_fp16, y = var_3092_to_fp16)[name = tensor("aw_179_cast_fp16")]; + tensor var_3095_equation_0 = const()[name = tensor("op_3095_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3095_cast_fp16 = einsum(equation = var_3095_equation_0, values = (var_2937_cast_fp16, var_2854_cast_fp16))[name = tensor("op_3095_cast_fp16")]; + tensor var_3096_to_fp16 = const()[name = tensor("op_3096_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_181_cast_fp16 = mul(x = var_3095_cast_fp16, y = var_3096_to_fp16)[name = tensor("aw_181_cast_fp16")]; + tensor var_3099_equation_0 = const()[name = tensor("op_3099_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3099_cast_fp16 = einsum(equation = var_3099_equation_0, values = (var_2941_cast_fp16, var_2858_cast_fp16))[name = tensor("op_3099_cast_fp16")]; + tensor var_3100_to_fp16 = const()[name = tensor("op_3100_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_183_cast_fp16 = mul(x = var_3099_cast_fp16, y = var_3100_to_fp16)[name = tensor("aw_183_cast_fp16")]; + tensor var_3103_equation_0 = const()[name = tensor("op_3103_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3103_cast_fp16 = einsum(equation = var_3103_equation_0, values = (var_2945_cast_fp16, var_2862_cast_fp16))[name = tensor("op_3103_cast_fp16")]; + tensor var_3104_to_fp16 = const()[name = tensor("op_3104_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_185_cast_fp16 = mul(x = var_3103_cast_fp16, y = var_3104_to_fp16)[name = tensor("aw_185_cast_fp16")]; + tensor var_3107_equation_0 = const()[name = tensor("op_3107_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3107_cast_fp16 = einsum(equation = var_3107_equation_0, values = (var_2949_cast_fp16, var_2866_cast_fp16))[name = tensor("op_3107_cast_fp16")]; + tensor var_3108_to_fp16 = const()[name = tensor("op_3108_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_187_cast_fp16 = mul(x = var_3107_cast_fp16, y = var_3108_to_fp16)[name = tensor("aw_187_cast_fp16")]; + tensor var_3111_equation_0 = const()[name = tensor("op_3111_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3111_cast_fp16 = einsum(equation = var_3111_equation_0, values = (var_2953_cast_fp16, var_2870_cast_fp16))[name = tensor("op_3111_cast_fp16")]; + tensor var_3112_to_fp16 = const()[name = tensor("op_3112_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_189_cast_fp16 = mul(x = var_3111_cast_fp16, y = var_3112_to_fp16)[name = tensor("aw_189_cast_fp16")]; + tensor var_3115_equation_0 = const()[name = tensor("op_3115_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3115_cast_fp16 = einsum(equation = var_3115_equation_0, values = (var_2957_cast_fp16, var_2874_cast_fp16))[name = tensor("op_3115_cast_fp16")]; + tensor var_3116_to_fp16 = const()[name = tensor("op_3116_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_191_cast_fp16 = mul(x = var_3115_cast_fp16, y = var_3116_to_fp16)[name = tensor("aw_191_cast_fp16")]; + tensor var_3119_equation_0 = const()[name = tensor("op_3119_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3119_cast_fp16 = einsum(equation = var_3119_equation_0, values = (var_2961_cast_fp16, var_2878_cast_fp16))[name = tensor("op_3119_cast_fp16")]; + tensor var_3120_to_fp16 = const()[name = tensor("op_3120_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_193_cast_fp16 = mul(x = var_3119_cast_fp16, y = var_3120_to_fp16)[name = tensor("aw_193_cast_fp16")]; + tensor var_3123_equation_0 = const()[name = tensor("op_3123_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3123_cast_fp16 = einsum(equation = var_3123_equation_0, values = (var_2965_cast_fp16, var_2882_cast_fp16))[name = tensor("op_3123_cast_fp16")]; + tensor var_3124_to_fp16 = const()[name = tensor("op_3124_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_195_cast_fp16 = mul(x = var_3123_cast_fp16, y = var_3124_to_fp16)[name = tensor("aw_195_cast_fp16")]; + tensor var_3127_equation_0 = const()[name = tensor("op_3127_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3127_cast_fp16 = einsum(equation = var_3127_equation_0, values = (var_2969_cast_fp16, var_2886_cast_fp16))[name = tensor("op_3127_cast_fp16")]; + tensor var_3128_to_fp16 = const()[name = tensor("op_3128_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_197_cast_fp16 = mul(x = var_3127_cast_fp16, y = var_3128_to_fp16)[name = tensor("aw_197_cast_fp16")]; + tensor var_3131_equation_0 = const()[name = tensor("op_3131_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3131_cast_fp16 = einsum(equation = var_3131_equation_0, values = (var_2973_cast_fp16, var_2890_cast_fp16))[name = tensor("op_3131_cast_fp16")]; + tensor var_3132_to_fp16 = const()[name = tensor("op_3132_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_199_cast_fp16 = mul(x = var_3131_cast_fp16, y = var_3132_to_fp16)[name = tensor("aw_199_cast_fp16")]; + tensor var_3134_cast_fp16 = softmax(axis = var_2254, x = aw_161_cast_fp16)[name = tensor("op_3134_cast_fp16")]; + tensor var_3135_cast_fp16 = softmax(axis = var_2254, x = aw_163_cast_fp16)[name = tensor("op_3135_cast_fp16")]; + tensor var_3136_cast_fp16 = softmax(axis = var_2254, x = aw_165_cast_fp16)[name = tensor("op_3136_cast_fp16")]; + tensor var_3137_cast_fp16 = softmax(axis = var_2254, x = aw_167_cast_fp16)[name = tensor("op_3137_cast_fp16")]; + tensor var_3138_cast_fp16 = softmax(axis = var_2254, x = aw_169_cast_fp16)[name = tensor("op_3138_cast_fp16")]; + tensor var_3139_cast_fp16 = softmax(axis = var_2254, x = aw_171_cast_fp16)[name = tensor("op_3139_cast_fp16")]; + tensor var_3140_cast_fp16 = softmax(axis = var_2254, x = aw_173_cast_fp16)[name = tensor("op_3140_cast_fp16")]; + tensor var_3141_cast_fp16 = softmax(axis = var_2254, x = aw_175_cast_fp16)[name = tensor("op_3141_cast_fp16")]; + tensor var_3142_cast_fp16 = softmax(axis = var_2254, x = aw_177_cast_fp16)[name = tensor("op_3142_cast_fp16")]; + tensor var_3143_cast_fp16 = softmax(axis = var_2254, x = aw_179_cast_fp16)[name = tensor("op_3143_cast_fp16")]; + tensor var_3144_cast_fp16 = softmax(axis = var_2254, x = aw_181_cast_fp16)[name = tensor("op_3144_cast_fp16")]; + tensor var_3145_cast_fp16 = softmax(axis = var_2254, x = aw_183_cast_fp16)[name = tensor("op_3145_cast_fp16")]; + tensor var_3146_cast_fp16 = softmax(axis = var_2254, x = aw_185_cast_fp16)[name = tensor("op_3146_cast_fp16")]; + tensor var_3147_cast_fp16 = softmax(axis = var_2254, x = aw_187_cast_fp16)[name = tensor("op_3147_cast_fp16")]; + tensor var_3148_cast_fp16 = softmax(axis = var_2254, x = aw_189_cast_fp16)[name = tensor("op_3148_cast_fp16")]; + tensor var_3149_cast_fp16 = softmax(axis = var_2254, x = aw_191_cast_fp16)[name = tensor("op_3149_cast_fp16")]; + tensor var_3150_cast_fp16 = softmax(axis = var_2254, x = aw_193_cast_fp16)[name = tensor("op_3150_cast_fp16")]; + tensor var_3151_cast_fp16 = softmax(axis = var_2254, x = aw_195_cast_fp16)[name = tensor("op_3151_cast_fp16")]; + tensor var_3152_cast_fp16 = softmax(axis = var_2254, x = aw_197_cast_fp16)[name = tensor("op_3152_cast_fp16")]; + tensor var_3153_cast_fp16 = softmax(axis = var_2254, x = aw_199_cast_fp16)[name = tensor("op_3153_cast_fp16")]; + tensor var_3155_equation_0 = const()[name = tensor("op_3155_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3155_cast_fp16 = einsum(equation = var_3155_equation_0, values = (var_2975_cast_fp16, var_3134_cast_fp16))[name = tensor("op_3155_cast_fp16")]; + tensor var_3157_equation_0 = const()[name = tensor("op_3157_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3157_cast_fp16 = einsum(equation = var_3157_equation_0, values = (var_2979_cast_fp16, var_3135_cast_fp16))[name = tensor("op_3157_cast_fp16")]; + tensor var_3159_equation_0 = const()[name = tensor("op_3159_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3159_cast_fp16 = einsum(equation = var_3159_equation_0, values = (var_2983_cast_fp16, var_3136_cast_fp16))[name = tensor("op_3159_cast_fp16")]; + tensor var_3161_equation_0 = const()[name = tensor("op_3161_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3161_cast_fp16 = einsum(equation = var_3161_equation_0, values = (var_2987_cast_fp16, var_3137_cast_fp16))[name = tensor("op_3161_cast_fp16")]; + tensor var_3163_equation_0 = const()[name = tensor("op_3163_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3163_cast_fp16 = einsum(equation = var_3163_equation_0, values = (var_2991_cast_fp16, var_3138_cast_fp16))[name = tensor("op_3163_cast_fp16")]; + tensor var_3165_equation_0 = const()[name = tensor("op_3165_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3165_cast_fp16 = einsum(equation = var_3165_equation_0, values = (var_2995_cast_fp16, var_3139_cast_fp16))[name = tensor("op_3165_cast_fp16")]; + tensor var_3167_equation_0 = const()[name = tensor("op_3167_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3167_cast_fp16 = einsum(equation = var_3167_equation_0, values = (var_2999_cast_fp16, var_3140_cast_fp16))[name = tensor("op_3167_cast_fp16")]; + tensor var_3169_equation_0 = const()[name = tensor("op_3169_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3169_cast_fp16 = einsum(equation = var_3169_equation_0, values = (var_3003_cast_fp16, var_3141_cast_fp16))[name = tensor("op_3169_cast_fp16")]; + tensor var_3171_equation_0 = const()[name = tensor("op_3171_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3171_cast_fp16 = einsum(equation = var_3171_equation_0, values = (var_3007_cast_fp16, var_3142_cast_fp16))[name = tensor("op_3171_cast_fp16")]; + tensor var_3173_equation_0 = const()[name = tensor("op_3173_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3173_cast_fp16 = einsum(equation = var_3173_equation_0, values = (var_3011_cast_fp16, var_3143_cast_fp16))[name = tensor("op_3173_cast_fp16")]; + tensor var_3175_equation_0 = const()[name = tensor("op_3175_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3175_cast_fp16 = einsum(equation = var_3175_equation_0, values = (var_3015_cast_fp16, var_3144_cast_fp16))[name = tensor("op_3175_cast_fp16")]; + tensor var_3177_equation_0 = const()[name = tensor("op_3177_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3177_cast_fp16 = einsum(equation = var_3177_equation_0, values = (var_3019_cast_fp16, var_3145_cast_fp16))[name = tensor("op_3177_cast_fp16")]; + tensor var_3179_equation_0 = const()[name = tensor("op_3179_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3179_cast_fp16 = einsum(equation = var_3179_equation_0, values = (var_3023_cast_fp16, var_3146_cast_fp16))[name = tensor("op_3179_cast_fp16")]; + tensor var_3181_equation_0 = const()[name = tensor("op_3181_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3181_cast_fp16 = einsum(equation = var_3181_equation_0, values = (var_3027_cast_fp16, var_3147_cast_fp16))[name = tensor("op_3181_cast_fp16")]; + tensor var_3183_equation_0 = const()[name = tensor("op_3183_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3183_cast_fp16 = einsum(equation = var_3183_equation_0, values = (var_3031_cast_fp16, var_3148_cast_fp16))[name = tensor("op_3183_cast_fp16")]; + tensor var_3185_equation_0 = const()[name = tensor("op_3185_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3185_cast_fp16 = einsum(equation = var_3185_equation_0, values = (var_3035_cast_fp16, var_3149_cast_fp16))[name = tensor("op_3185_cast_fp16")]; + tensor var_3187_equation_0 = const()[name = tensor("op_3187_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3187_cast_fp16 = einsum(equation = var_3187_equation_0, values = (var_3039_cast_fp16, var_3150_cast_fp16))[name = tensor("op_3187_cast_fp16")]; + tensor var_3189_equation_0 = const()[name = tensor("op_3189_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3189_cast_fp16 = einsum(equation = var_3189_equation_0, values = (var_3043_cast_fp16, var_3151_cast_fp16))[name = tensor("op_3189_cast_fp16")]; + tensor var_3191_equation_0 = const()[name = tensor("op_3191_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3191_cast_fp16 = einsum(equation = var_3191_equation_0, values = (var_3047_cast_fp16, var_3152_cast_fp16))[name = tensor("op_3191_cast_fp16")]; + tensor var_3193_equation_0 = const()[name = tensor("op_3193_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3193_cast_fp16 = einsum(equation = var_3193_equation_0, values = (var_3051_cast_fp16, var_3153_cast_fp16))[name = tensor("op_3193_cast_fp16")]; + tensor input_135_interleave_0 = const()[name = tensor("input_135_interleave_0"), val = tensor(false)]; + tensor input_135_cast_fp16 = concat(axis = var_2254, interleave = input_135_interleave_0, values = (var_3155_cast_fp16, var_3157_cast_fp16, var_3159_cast_fp16, var_3161_cast_fp16, var_3163_cast_fp16, var_3165_cast_fp16, var_3167_cast_fp16, var_3169_cast_fp16, var_3171_cast_fp16, var_3173_cast_fp16, var_3175_cast_fp16, var_3177_cast_fp16, var_3179_cast_fp16, var_3181_cast_fp16, var_3183_cast_fp16, var_3185_cast_fp16, var_3187_cast_fp16, var_3189_cast_fp16, var_3191_cast_fp16, var_3193_cast_fp16))[name = tensor("input_135_cast_fp16")]; + tensor var_3199 = const()[name = tensor("op_3199"), val = tensor([1, 1])]; + tensor var_3201 = const()[name = tensor("op_3201"), val = tensor([1, 1])]; + tensor var_3203_pad_type_0 = const()[name = tensor("op_3203_pad_type_0"), val = tensor("custom")]; + tensor var_3203_pad_0 = const()[name = tensor("op_3203_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(174892608)))]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178169472)))]; + tensor var_3203_cast_fp16 = conv(bias = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_3201, groups = var_2254, pad = var_3203_pad_0, pad_type = var_3203_pad_type_0, strides = var_3199, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_135_cast_fp16)[name = tensor("op_3203_cast_fp16")]; + tensor inputs_29_cast_fp16 = add(x = var_3203_cast_fp16, y = inputs_27_cast_fp16)[name = tensor("inputs_29_cast_fp16")]; + tensor var_3207 = const()[name = tensor("op_3207"), val = tensor([1])]; + tensor channels_mean_29_cast_fp16 = reduce_mean(axes = var_3207, keep_dims = var_2249, x = inputs_29_cast_fp16)[name = tensor("channels_mean_29_cast_fp16")]; + tensor zero_mean_29_cast_fp16 = sub(x = inputs_29_cast_fp16, y = channels_mean_29_cast_fp16)[name = tensor("zero_mean_29_cast_fp16")]; + tensor zero_mean_sq_29_cast_fp16 = mul(x = zero_mean_29_cast_fp16, y = zero_mean_29_cast_fp16)[name = tensor("zero_mean_sq_29_cast_fp16")]; + tensor var_3211 = const()[name = tensor("op_3211"), val = tensor([1])]; + tensor var_3212_cast_fp16 = reduce_mean(axes = var_3211, keep_dims = var_2249, x = zero_mean_sq_29_cast_fp16)[name = tensor("op_3212_cast_fp16")]; + tensor var_3213_to_fp16 = const()[name = tensor("op_3213_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_3214_cast_fp16 = add(x = var_3212_cast_fp16, y = var_3213_to_fp16)[name = tensor("op_3214_cast_fp16")]; + tensor denom_29_epsilon_0_to_fp16 = const()[name = tensor("denom_29_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_29_cast_fp16 = rsqrt(epsilon = denom_29_epsilon_0_to_fp16, x = var_3214_cast_fp16)[name = tensor("denom_29_cast_fp16")]; + tensor out_29_cast_fp16 = mul(x = zero_mean_29_cast_fp16, y = denom_29_cast_fp16)[name = tensor("out_29_cast_fp16")]; + tensor var_3218_to_fp16 = const()[name = tensor("op_3218_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178172096)))]; + tensor var_3219_cast_fp16 = add(x = out_29_cast_fp16, y = var_3218_to_fp16)[name = tensor("op_3219_cast_fp16")]; + tensor var_3221_to_fp16 = const()[name = tensor("op_3221_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178174720)))]; + tensor input_137_cast_fp16 = mul(x = var_3219_cast_fp16, y = var_3221_to_fp16)[name = tensor("input_137_cast_fp16")]; + tensor var_3229 = const()[name = tensor("op_3229"), val = tensor([1, 1])]; + tensor var_3231 = const()[name = tensor("op_3231"), val = tensor([1, 1])]; + tensor var_3233_pad_type_0 = const()[name = tensor("op_3233_pad_type_0"), val = tensor("custom")]; + tensor var_3233_pad_0 = const()[name = tensor("op_3233_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178177344)))]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204391808)))]; + tensor var_3233_cast_fp16 = conv(bias = down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_3231, groups = var_2254, pad = var_3233_pad_0, pad_type = var_3233_pad_type_0, strides = var_3229, weight = down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_137_cast_fp16)[name = tensor("op_3233_cast_fp16")]; + tensor var_3234_split_sizes_0 = const()[name = tensor("op_3234_split_sizes_0"), val = tensor([5120, 5120])]; + tensor var_3234_axis_0 = const()[name = tensor("op_3234_axis_0"), val = tensor(1)]; + tensor var_3234_cast_fp16_0, tensor var_3234_cast_fp16_1 = split(axis = var_3234_axis_0, split_sizes = var_3234_split_sizes_0, x = var_3233_cast_fp16)[name = tensor("op_3234_cast_fp16")]; + tensor var_3236_mode_0 = const()[name = tensor("op_3236_mode_0"), val = tensor("EXACT")]; + tensor var_3236_cast_fp16 = gelu(mode = var_3236_mode_0, x = var_3234_cast_fp16_1)[name = tensor("op_3236_cast_fp16")]; + tensor input_139_cast_fp16 = mul(x = var_3234_cast_fp16_0, y = var_3236_cast_fp16)[name = tensor("input_139_cast_fp16")]; + tensor var_3240 = const()[name = tensor("op_3240"), val = tensor([1, 1])]; + tensor var_3242 = const()[name = tensor("op_3242"), val = tensor([1, 1])]; + tensor var_3244_pad_type_0 = const()[name = tensor("op_3244_pad_type_0"), val = tensor("custom")]; + tensor var_3244_pad_0 = const()[name = tensor("op_3244_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204412352)))]; + tensor down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217519616)))]; + tensor var_3244_cast_fp16 = conv(bias = down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_3242, groups = var_2254, pad = var_3244_pad_0, pad_type = var_3244_pad_type_0, strides = var_3240, weight = down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_139_cast_fp16)[name = tensor("op_3244_cast_fp16")]; + tensor hidden_states_87_cast_fp16 = add(x = var_3244_cast_fp16, y = inputs_29_cast_fp16)[name = tensor("hidden_states_87_cast_fp16")]; + tensor var_3246 = const()[name = tensor("op_3246"), val = tensor([2, 1280, 12, 12])]; + tensor input_141_cast_fp16 = reshape(shape = var_3246, x = hidden_states_87_cast_fp16)[name = tensor("input_141_cast_fp16")]; + tensor var_3250 = const()[name = tensor("op_3250"), val = tensor([1, 1])]; + tensor var_3252 = const()[name = tensor("op_3252"), val = tensor([1, 1])]; + tensor hidden_states_89_pad_type_0 = const()[name = tensor("hidden_states_89_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_89_pad_0 = const()[name = tensor("hidden_states_89_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217522240)))]; + tensor down_blocks_2_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220799104)))]; + tensor hidden_states_89_cast_fp16 = conv(bias = down_blocks_2_attentions_0_proj_out_bias_to_fp16, dilations = var_3252, groups = var_2254, pad = hidden_states_89_pad_0, pad_type = hidden_states_89_pad_type_0, strides = var_3250, weight = down_blocks_2_attentions_0_proj_out_weight_to_fp16, x = input_141_cast_fp16)[name = tensor("hidden_states_89_cast_fp16")]; + tensor input_143_cast_fp16 = add(x = hidden_states_89_cast_fp16, y = hidden_states_77_cast_fp16)[name = tensor("input_143_cast_fp16")]; + tensor reshape_60_shape_0 = const()[name = tensor("reshape_60_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_60_cast_fp16 = reshape(shape = reshape_60_shape_0, x = input_143_cast_fp16)[name = tensor("reshape_60_cast_fp16")]; + tensor reduce_mean_45_axes_0 = const()[name = tensor("reduce_mean_45_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_45_keep_dims_0 = const()[name = tensor("reduce_mean_45_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_45_cast_fp16 = reduce_mean(axes = reduce_mean_45_axes_0, keep_dims = reduce_mean_45_keep_dims_0, x = reshape_60_cast_fp16)[name = tensor("reduce_mean_45_cast_fp16")]; + tensor sub_30_cast_fp16 = sub(x = reshape_60_cast_fp16, y = reduce_mean_45_cast_fp16)[name = tensor("sub_30_cast_fp16")]; + tensor square_15_cast_fp16 = square(x = sub_30_cast_fp16)[name = tensor("square_15_cast_fp16")]; + tensor reduce_mean_47_axes_0 = const()[name = tensor("reduce_mean_47_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_47_keep_dims_0 = const()[name = tensor("reduce_mean_47_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_47_cast_fp16 = reduce_mean(axes = reduce_mean_47_axes_0, keep_dims = reduce_mean_47_keep_dims_0, x = square_15_cast_fp16)[name = tensor("reduce_mean_47_cast_fp16")]; + tensor add_30_y_0_to_fp16 = const()[name = tensor("add_30_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_30_cast_fp16 = add(x = reduce_mean_47_cast_fp16, y = add_30_y_0_to_fp16)[name = tensor("add_30_cast_fp16")]; + tensor sqrt_15_cast_fp16 = sqrt(x = add_30_cast_fp16)[name = tensor("sqrt_15_cast_fp16")]; + tensor real_div_15_cast_fp16 = real_div(x = sub_30_cast_fp16, y = sqrt_15_cast_fp16)[name = tensor("real_div_15_cast_fp16")]; + tensor reshape_61_shape_0 = const()[name = tensor("reshape_61_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_61_cast_fp16 = reshape(shape = reshape_61_shape_0, x = real_div_15_cast_fp16)[name = tensor("reshape_61_cast_fp16")]; + tensor add_31_gamma_0_to_fp16 = const()[name = tensor("add_31_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220801728)))]; + tensor add_31_beta_0_to_fp16 = const()[name = tensor("add_31_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220804352)))]; + tensor add_31_epsilon_0_to_fp16 = const()[name = tensor("add_31_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_31_cast_fp16 = batch_norm(beta = add_31_beta_0_to_fp16, epsilon = add_31_epsilon_0_to_fp16, gamma = add_31_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_61_cast_fp16)[name = tensor("add_31_cast_fp16")]; + tensor input_147_cast_fp16 = silu(x = add_31_cast_fp16)[name = tensor("input_147_cast_fp16")]; + tensor var_3267 = const()[name = tensor("op_3267"), val = tensor([1, 1])]; + tensor var_3269 = const()[name = tensor("op_3269"), val = tensor([1, 1])]; + tensor hidden_states_91_pad_type_0 = const()[name = tensor("hidden_states_91_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_91_pad_0 = const()[name = tensor("hidden_states_91_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_2_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220806976)))]; + tensor down_blocks_2_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250298240)))]; + tensor hidden_states_91_cast_fp16 = conv(bias = down_blocks_2_resnets_1_conv1_bias_to_fp16, dilations = var_3269, groups = var_2254, pad = hidden_states_91_pad_0, pad_type = hidden_states_91_pad_type_0, strides = var_3267, weight = down_blocks_2_resnets_1_conv1_weight_to_fp16, x = input_147_cast_fp16)[name = tensor("hidden_states_91_cast_fp16")]; + tensor var_3275 = const()[name = tensor("op_3275"), val = tensor([1, 1])]; + tensor var_3277 = const()[name = tensor("op_3277"), val = tensor([1, 1])]; + tensor temb_11_pad_type_0 = const()[name = tensor("temb_11_pad_type_0"), val = tensor("custom")]; + tensor temb_11_pad_0 = const()[name = tensor("temb_11_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250300864)))]; + tensor down_blocks_2_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253577728)))]; + tensor temb_11_cast_fp16 = conv(bias = down_blocks_2_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_3277, groups = var_2254, pad = temb_11_pad_0, pad_type = temb_11_pad_type_0, strides = var_3275, weight = down_blocks_2_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_11_cast_fp16")]; + tensor input_151_cast_fp16 = add(x = hidden_states_91_cast_fp16, y = temb_11_cast_fp16)[name = tensor("input_151_cast_fp16")]; + tensor reshape_64_shape_0 = const()[name = tensor("reshape_64_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_64_cast_fp16 = reshape(shape = reshape_64_shape_0, x = input_151_cast_fp16)[name = tensor("reshape_64_cast_fp16")]; + tensor reduce_mean_48_axes_0 = const()[name = tensor("reduce_mean_48_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_48_keep_dims_0 = const()[name = tensor("reduce_mean_48_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_48_cast_fp16 = reduce_mean(axes = reduce_mean_48_axes_0, keep_dims = reduce_mean_48_keep_dims_0, x = reshape_64_cast_fp16)[name = tensor("reduce_mean_48_cast_fp16")]; + tensor sub_32_cast_fp16 = sub(x = reshape_64_cast_fp16, y = reduce_mean_48_cast_fp16)[name = tensor("sub_32_cast_fp16")]; + tensor square_16_cast_fp16 = square(x = sub_32_cast_fp16)[name = tensor("square_16_cast_fp16")]; + tensor reduce_mean_50_axes_0 = const()[name = tensor("reduce_mean_50_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_50_keep_dims_0 = const()[name = tensor("reduce_mean_50_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_50_cast_fp16 = reduce_mean(axes = reduce_mean_50_axes_0, keep_dims = reduce_mean_50_keep_dims_0, x = square_16_cast_fp16)[name = tensor("reduce_mean_50_cast_fp16")]; + tensor add_32_y_0_to_fp16 = const()[name = tensor("add_32_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_32_cast_fp16 = add(x = reduce_mean_50_cast_fp16, y = add_32_y_0_to_fp16)[name = tensor("add_32_cast_fp16")]; + tensor sqrt_16_cast_fp16 = sqrt(x = add_32_cast_fp16)[name = tensor("sqrt_16_cast_fp16")]; + tensor real_div_16_cast_fp16 = real_div(x = sub_32_cast_fp16, y = sqrt_16_cast_fp16)[name = tensor("real_div_16_cast_fp16")]; + tensor reshape_65_shape_0 = const()[name = tensor("reshape_65_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_65_cast_fp16 = reshape(shape = reshape_65_shape_0, x = real_div_16_cast_fp16)[name = tensor("reshape_65_cast_fp16")]; + tensor add_33_gamma_0_to_fp16 = const()[name = tensor("add_33_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253580352)))]; + tensor add_33_beta_0_to_fp16 = const()[name = tensor("add_33_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253582976)))]; + tensor add_33_epsilon_0_to_fp16 = const()[name = tensor("add_33_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_33_cast_fp16 = batch_norm(beta = add_33_beta_0_to_fp16, epsilon = add_33_epsilon_0_to_fp16, gamma = add_33_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_65_cast_fp16)[name = tensor("add_33_cast_fp16")]; + tensor input_155_cast_fp16 = silu(x = add_33_cast_fp16)[name = tensor("input_155_cast_fp16")]; + tensor var_3287 = const()[name = tensor("op_3287"), val = tensor([1, 1])]; + tensor var_3289 = const()[name = tensor("op_3289"), val = tensor([1, 1])]; + tensor hidden_states_93_pad_type_0 = const()[name = tensor("hidden_states_93_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_93_pad_0 = const()[name = tensor("hidden_states_93_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_2_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253585600)))]; + tensor down_blocks_2_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(283076864)))]; + tensor hidden_states_93_cast_fp16 = conv(bias = down_blocks_2_resnets_1_conv2_bias_to_fp16, dilations = var_3289, groups = var_2254, pad = hidden_states_93_pad_0, pad_type = hidden_states_93_pad_type_0, strides = var_3287, weight = down_blocks_2_resnets_1_conv2_weight_to_fp16, x = input_155_cast_fp16)[name = tensor("hidden_states_93_cast_fp16")]; + tensor hidden_states_95_cast_fp16 = add(x = input_143_cast_fp16, y = hidden_states_93_cast_fp16)[name = tensor("hidden_states_95_cast_fp16")]; + tensor reshape_68_shape_0 = const()[name = tensor("reshape_68_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_68_cast_fp16 = reshape(shape = reshape_68_shape_0, x = hidden_states_95_cast_fp16)[name = tensor("reshape_68_cast_fp16")]; + tensor reduce_mean_51_axes_0 = const()[name = tensor("reduce_mean_51_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_51_keep_dims_0 = const()[name = tensor("reduce_mean_51_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_51_cast_fp16 = reduce_mean(axes = reduce_mean_51_axes_0, keep_dims = reduce_mean_51_keep_dims_0, x = reshape_68_cast_fp16)[name = tensor("reduce_mean_51_cast_fp16")]; + tensor sub_34_cast_fp16 = sub(x = reshape_68_cast_fp16, y = reduce_mean_51_cast_fp16)[name = tensor("sub_34_cast_fp16")]; + tensor square_17_cast_fp16 = square(x = sub_34_cast_fp16)[name = tensor("square_17_cast_fp16")]; + tensor reduce_mean_53_axes_0 = const()[name = tensor("reduce_mean_53_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_53_keep_dims_0 = const()[name = tensor("reduce_mean_53_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_53_cast_fp16 = reduce_mean(axes = reduce_mean_53_axes_0, keep_dims = reduce_mean_53_keep_dims_0, x = square_17_cast_fp16)[name = tensor("reduce_mean_53_cast_fp16")]; + tensor add_34_y_0_to_fp16 = const()[name = tensor("add_34_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_34_cast_fp16 = add(x = reduce_mean_53_cast_fp16, y = add_34_y_0_to_fp16)[name = tensor("add_34_cast_fp16")]; + tensor sqrt_17_cast_fp16 = sqrt(x = add_34_cast_fp16)[name = tensor("sqrt_17_cast_fp16")]; + tensor real_div_17_cast_fp16 = real_div(x = sub_34_cast_fp16, y = sqrt_17_cast_fp16)[name = tensor("real_div_17_cast_fp16")]; + tensor reshape_69_shape_0 = const()[name = tensor("reshape_69_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_69_cast_fp16 = reshape(shape = reshape_69_shape_0, x = real_div_17_cast_fp16)[name = tensor("reshape_69_cast_fp16")]; + tensor add_35_gamma_0_to_fp16 = const()[name = tensor("add_35_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(283079488)))]; + tensor add_35_beta_0_to_fp16 = const()[name = tensor("add_35_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(283082112)))]; + tensor add_35_epsilon_0_to_fp16 = const()[name = tensor("add_35_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_35_cast_fp16 = batch_norm(beta = add_35_beta_0_to_fp16, epsilon = add_35_epsilon_0_to_fp16, gamma = add_35_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_69_cast_fp16)[name = tensor("add_35_cast_fp16")]; + tensor var_3309 = const()[name = tensor("op_3309"), val = tensor([1, 1])]; + tensor var_3311 = const()[name = tensor("op_3311"), val = tensor([1, 1])]; + tensor hidden_states_97_pad_type_0 = const()[name = tensor("hidden_states_97_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_97_pad_0 = const()[name = tensor("hidden_states_97_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(283084736)))]; + tensor down_blocks_2_attentions_1_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286361600)))]; + tensor hidden_states_97_cast_fp16 = conv(bias = down_blocks_2_attentions_1_proj_in_bias_to_fp16, dilations = var_3311, groups = var_2254, pad = hidden_states_97_pad_0, pad_type = hidden_states_97_pad_type_0, strides = var_3309, weight = down_blocks_2_attentions_1_proj_in_weight_to_fp16, x = add_35_cast_fp16)[name = tensor("hidden_states_97_cast_fp16")]; + tensor var_3316 = const()[name = tensor("op_3316"), val = tensor([2, 1280, 1, 144])]; + tensor inputs_31_cast_fp16 = reshape(shape = var_3316, x = hidden_states_97_cast_fp16)[name = tensor("inputs_31_cast_fp16")]; + tensor var_3326 = const()[name = tensor("op_3326"), val = tensor([1])]; + tensor channels_mean_31_cast_fp16 = reduce_mean(axes = var_3326, keep_dims = var_2249, x = inputs_31_cast_fp16)[name = tensor("channels_mean_31_cast_fp16")]; + tensor zero_mean_31_cast_fp16 = sub(x = inputs_31_cast_fp16, y = channels_mean_31_cast_fp16)[name = tensor("zero_mean_31_cast_fp16")]; + tensor zero_mean_sq_31_cast_fp16 = mul(x = zero_mean_31_cast_fp16, y = zero_mean_31_cast_fp16)[name = tensor("zero_mean_sq_31_cast_fp16")]; + tensor var_3330 = const()[name = tensor("op_3330"), val = tensor([1])]; + tensor var_3331_cast_fp16 = reduce_mean(axes = var_3330, keep_dims = var_2249, x = zero_mean_sq_31_cast_fp16)[name = tensor("op_3331_cast_fp16")]; + tensor var_3332_to_fp16 = const()[name = tensor("op_3332_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_3333_cast_fp16 = add(x = var_3331_cast_fp16, y = var_3332_to_fp16)[name = tensor("op_3333_cast_fp16")]; + tensor denom_31_epsilon_0_to_fp16 = const()[name = tensor("denom_31_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_31_cast_fp16 = rsqrt(epsilon = denom_31_epsilon_0_to_fp16, x = var_3333_cast_fp16)[name = tensor("denom_31_cast_fp16")]; + tensor out_31_cast_fp16 = mul(x = zero_mean_31_cast_fp16, y = denom_31_cast_fp16)[name = tensor("out_31_cast_fp16")]; + tensor var_3337_to_fp16 = const()[name = tensor("op_3337_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286364224)))]; + tensor var_3338_cast_fp16 = add(x = out_31_cast_fp16, y = var_3337_to_fp16)[name = tensor("op_3338_cast_fp16")]; + tensor var_3340_to_fp16 = const()[name = tensor("op_3340_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286366848)))]; + tensor hidden_states_99_cast_fp16 = mul(x = var_3338_cast_fp16, y = var_3340_to_fp16)[name = tensor("hidden_states_99_cast_fp16")]; + tensor var_3347 = const()[name = tensor("op_3347"), val = tensor([1, 1])]; + tensor var_3349 = const()[name = tensor("op_3349"), val = tensor([1, 1])]; + tensor q_21_pad_type_0 = const()[name = tensor("q_21_pad_type_0"), val = tensor("custom")]; + tensor q_21_pad_0 = const()[name = tensor("q_21_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286369472)))]; + tensor q_21_cast_fp16 = conv(dilations = var_3349, groups = var_2254, pad = q_21_pad_0, pad_type = q_21_pad_type_0, strides = var_3347, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_99_cast_fp16)[name = tensor("q_21_cast_fp16")]; + tensor var_3353 = const()[name = tensor("op_3353"), val = tensor([1, 1])]; + tensor var_3355 = const()[name = tensor("op_3355"), val = tensor([1, 1])]; + tensor k_41_pad_type_0 = const()[name = tensor("k_41_pad_type_0"), val = tensor("custom")]; + tensor k_41_pad_0 = const()[name = tensor("k_41_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(289646336)))]; + tensor k_41_cast_fp16 = conv(dilations = var_3355, groups = var_2254, pad = k_41_pad_0, pad_type = k_41_pad_type_0, strides = var_3353, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_99_cast_fp16)[name = tensor("k_41_cast_fp16")]; + tensor var_3359 = const()[name = tensor("op_3359"), val = tensor([1, 1])]; + tensor var_3361 = const()[name = tensor("op_3361"), val = tensor([1, 1])]; + tensor v_21_pad_type_0 = const()[name = tensor("v_21_pad_type_0"), val = tensor("custom")]; + tensor v_21_pad_0 = const()[name = tensor("v_21_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292923200)))]; + tensor v_21_cast_fp16 = conv(dilations = var_3361, groups = var_2254, pad = v_21_pad_0, pad_type = v_21_pad_type_0, strides = var_3359, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_99_cast_fp16)[name = tensor("v_21_cast_fp16")]; + tensor var_3365_begin_0 = const()[name = tensor("op_3365_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_3365_end_0 = const()[name = tensor("op_3365_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_3365_end_mask_0 = const()[name = tensor("op_3365_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3365_cast_fp16 = slice_by_index(begin = var_3365_begin_0, end = var_3365_end_0, end_mask = var_3365_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3365_cast_fp16")]; + tensor var_3369_begin_0 = const()[name = tensor("op_3369_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_3369_end_0 = const()[name = tensor("op_3369_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_3369_end_mask_0 = const()[name = tensor("op_3369_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3369_cast_fp16 = slice_by_index(begin = var_3369_begin_0, end = var_3369_end_0, end_mask = var_3369_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3369_cast_fp16")]; + tensor var_3373_begin_0 = const()[name = tensor("op_3373_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_3373_end_0 = const()[name = tensor("op_3373_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_3373_end_mask_0 = const()[name = tensor("op_3373_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3373_cast_fp16 = slice_by_index(begin = var_3373_begin_0, end = var_3373_end_0, end_mask = var_3373_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3373_cast_fp16")]; + tensor var_3377_begin_0 = const()[name = tensor("op_3377_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_3377_end_0 = const()[name = tensor("op_3377_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_3377_end_mask_0 = const()[name = tensor("op_3377_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3377_cast_fp16 = slice_by_index(begin = var_3377_begin_0, end = var_3377_end_0, end_mask = var_3377_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3377_cast_fp16")]; + tensor var_3381_begin_0 = const()[name = tensor("op_3381_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_3381_end_0 = const()[name = tensor("op_3381_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_3381_end_mask_0 = const()[name = tensor("op_3381_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3381_cast_fp16 = slice_by_index(begin = var_3381_begin_0, end = var_3381_end_0, end_mask = var_3381_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3381_cast_fp16")]; + tensor var_3385_begin_0 = const()[name = tensor("op_3385_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_3385_end_0 = const()[name = tensor("op_3385_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_3385_end_mask_0 = const()[name = tensor("op_3385_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3385_cast_fp16 = slice_by_index(begin = var_3385_begin_0, end = var_3385_end_0, end_mask = var_3385_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3385_cast_fp16")]; + tensor var_3389_begin_0 = const()[name = tensor("op_3389_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_3389_end_0 = const()[name = tensor("op_3389_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_3389_end_mask_0 = const()[name = tensor("op_3389_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3389_cast_fp16 = slice_by_index(begin = var_3389_begin_0, end = var_3389_end_0, end_mask = var_3389_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3389_cast_fp16")]; + tensor var_3393_begin_0 = const()[name = tensor("op_3393_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_3393_end_0 = const()[name = tensor("op_3393_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_3393_end_mask_0 = const()[name = tensor("op_3393_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3393_cast_fp16 = slice_by_index(begin = var_3393_begin_0, end = var_3393_end_0, end_mask = var_3393_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3393_cast_fp16")]; + tensor var_3397_begin_0 = const()[name = tensor("op_3397_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_3397_end_0 = const()[name = tensor("op_3397_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_3397_end_mask_0 = const()[name = tensor("op_3397_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3397_cast_fp16 = slice_by_index(begin = var_3397_begin_0, end = var_3397_end_0, end_mask = var_3397_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3397_cast_fp16")]; + tensor var_3401_begin_0 = const()[name = tensor("op_3401_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_3401_end_0 = const()[name = tensor("op_3401_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_3401_end_mask_0 = const()[name = tensor("op_3401_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3401_cast_fp16 = slice_by_index(begin = var_3401_begin_0, end = var_3401_end_0, end_mask = var_3401_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3401_cast_fp16")]; + tensor var_3405_begin_0 = const()[name = tensor("op_3405_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_3405_end_0 = const()[name = tensor("op_3405_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_3405_end_mask_0 = const()[name = tensor("op_3405_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3405_cast_fp16 = slice_by_index(begin = var_3405_begin_0, end = var_3405_end_0, end_mask = var_3405_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3405_cast_fp16")]; + tensor var_3409_begin_0 = const()[name = tensor("op_3409_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_3409_end_0 = const()[name = tensor("op_3409_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_3409_end_mask_0 = const()[name = tensor("op_3409_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3409_cast_fp16 = slice_by_index(begin = var_3409_begin_0, end = var_3409_end_0, end_mask = var_3409_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3409_cast_fp16")]; + tensor var_3413_begin_0 = const()[name = tensor("op_3413_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_3413_end_0 = const()[name = tensor("op_3413_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_3413_end_mask_0 = const()[name = tensor("op_3413_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3413_cast_fp16 = slice_by_index(begin = var_3413_begin_0, end = var_3413_end_0, end_mask = var_3413_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3413_cast_fp16")]; + tensor var_3417_begin_0 = const()[name = tensor("op_3417_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_3417_end_0 = const()[name = tensor("op_3417_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_3417_end_mask_0 = const()[name = tensor("op_3417_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3417_cast_fp16 = slice_by_index(begin = var_3417_begin_0, end = var_3417_end_0, end_mask = var_3417_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3417_cast_fp16")]; + tensor var_3421_begin_0 = const()[name = tensor("op_3421_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_3421_end_0 = const()[name = tensor("op_3421_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_3421_end_mask_0 = const()[name = tensor("op_3421_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3421_cast_fp16 = slice_by_index(begin = var_3421_begin_0, end = var_3421_end_0, end_mask = var_3421_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3421_cast_fp16")]; + tensor var_3425_begin_0 = const()[name = tensor("op_3425_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_3425_end_0 = const()[name = tensor("op_3425_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_3425_end_mask_0 = const()[name = tensor("op_3425_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3425_cast_fp16 = slice_by_index(begin = var_3425_begin_0, end = var_3425_end_0, end_mask = var_3425_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3425_cast_fp16")]; + tensor var_3429_begin_0 = const()[name = tensor("op_3429_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_3429_end_0 = const()[name = tensor("op_3429_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_3429_end_mask_0 = const()[name = tensor("op_3429_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3429_cast_fp16 = slice_by_index(begin = var_3429_begin_0, end = var_3429_end_0, end_mask = var_3429_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3429_cast_fp16")]; + tensor var_3433_begin_0 = const()[name = tensor("op_3433_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_3433_end_0 = const()[name = tensor("op_3433_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_3433_end_mask_0 = const()[name = tensor("op_3433_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3433_cast_fp16 = slice_by_index(begin = var_3433_begin_0, end = var_3433_end_0, end_mask = var_3433_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3433_cast_fp16")]; + tensor var_3437_begin_0 = const()[name = tensor("op_3437_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_3437_end_0 = const()[name = tensor("op_3437_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_3437_end_mask_0 = const()[name = tensor("op_3437_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3437_cast_fp16 = slice_by_index(begin = var_3437_begin_0, end = var_3437_end_0, end_mask = var_3437_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3437_cast_fp16")]; + tensor var_3441_begin_0 = const()[name = tensor("op_3441_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_3441_end_0 = const()[name = tensor("op_3441_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_3441_end_mask_0 = const()[name = tensor("op_3441_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3441_cast_fp16 = slice_by_index(begin = var_3441_begin_0, end = var_3441_end_0, end_mask = var_3441_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3441_cast_fp16")]; + tensor k_43_perm_0 = const()[name = tensor("k_43_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_3448_begin_0 = const()[name = tensor("op_3448_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_3448_end_0 = const()[name = tensor("op_3448_end_0"), val = tensor([2, 144, 1, 64])]; + tensor var_3448_end_mask_0 = const()[name = tensor("op_3448_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_21 = transpose(perm = k_43_perm_0, x = k_41_cast_fp16)[name = tensor("transpose_21")]; + tensor var_3448_cast_fp16 = slice_by_index(begin = var_3448_begin_0, end = var_3448_end_0, end_mask = var_3448_end_mask_0, x = transpose_21)[name = tensor("op_3448_cast_fp16")]; + tensor var_3452_begin_0 = const()[name = tensor("op_3452_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_3452_end_0 = const()[name = tensor("op_3452_end_0"), val = tensor([2, 144, 1, 128])]; + tensor var_3452_end_mask_0 = const()[name = tensor("op_3452_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3452_cast_fp16 = slice_by_index(begin = var_3452_begin_0, end = var_3452_end_0, end_mask = var_3452_end_mask_0, x = transpose_21)[name = tensor("op_3452_cast_fp16")]; + tensor var_3456_begin_0 = const()[name = tensor("op_3456_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_3456_end_0 = const()[name = tensor("op_3456_end_0"), val = tensor([2, 144, 1, 192])]; + tensor var_3456_end_mask_0 = const()[name = tensor("op_3456_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3456_cast_fp16 = slice_by_index(begin = var_3456_begin_0, end = var_3456_end_0, end_mask = var_3456_end_mask_0, x = transpose_21)[name = tensor("op_3456_cast_fp16")]; + tensor var_3460_begin_0 = const()[name = tensor("op_3460_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_3460_end_0 = const()[name = tensor("op_3460_end_0"), val = tensor([2, 144, 1, 256])]; + tensor var_3460_end_mask_0 = const()[name = tensor("op_3460_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3460_cast_fp16 = slice_by_index(begin = var_3460_begin_0, end = var_3460_end_0, end_mask = var_3460_end_mask_0, x = transpose_21)[name = tensor("op_3460_cast_fp16")]; + tensor var_3464_begin_0 = const()[name = tensor("op_3464_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_3464_end_0 = const()[name = tensor("op_3464_end_0"), val = tensor([2, 144, 1, 320])]; + tensor var_3464_end_mask_0 = const()[name = tensor("op_3464_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3464_cast_fp16 = slice_by_index(begin = var_3464_begin_0, end = var_3464_end_0, end_mask = var_3464_end_mask_0, x = transpose_21)[name = tensor("op_3464_cast_fp16")]; + tensor var_3468_begin_0 = const()[name = tensor("op_3468_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_3468_end_0 = const()[name = tensor("op_3468_end_0"), val = tensor([2, 144, 1, 384])]; + tensor var_3468_end_mask_0 = const()[name = tensor("op_3468_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3468_cast_fp16 = slice_by_index(begin = var_3468_begin_0, end = var_3468_end_0, end_mask = var_3468_end_mask_0, x = transpose_21)[name = tensor("op_3468_cast_fp16")]; + tensor var_3472_begin_0 = const()[name = tensor("op_3472_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_3472_end_0 = const()[name = tensor("op_3472_end_0"), val = tensor([2, 144, 1, 448])]; + tensor var_3472_end_mask_0 = const()[name = tensor("op_3472_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3472_cast_fp16 = slice_by_index(begin = var_3472_begin_0, end = var_3472_end_0, end_mask = var_3472_end_mask_0, x = transpose_21)[name = tensor("op_3472_cast_fp16")]; + tensor var_3476_begin_0 = const()[name = tensor("op_3476_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_3476_end_0 = const()[name = tensor("op_3476_end_0"), val = tensor([2, 144, 1, 512])]; + tensor var_3476_end_mask_0 = const()[name = tensor("op_3476_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3476_cast_fp16 = slice_by_index(begin = var_3476_begin_0, end = var_3476_end_0, end_mask = var_3476_end_mask_0, x = transpose_21)[name = tensor("op_3476_cast_fp16")]; + tensor var_3480_begin_0 = const()[name = tensor("op_3480_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_3480_end_0 = const()[name = tensor("op_3480_end_0"), val = tensor([2, 144, 1, 576])]; + tensor var_3480_end_mask_0 = const()[name = tensor("op_3480_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3480_cast_fp16 = slice_by_index(begin = var_3480_begin_0, end = var_3480_end_0, end_mask = var_3480_end_mask_0, x = transpose_21)[name = tensor("op_3480_cast_fp16")]; + tensor var_3484_begin_0 = const()[name = tensor("op_3484_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_3484_end_0 = const()[name = tensor("op_3484_end_0"), val = tensor([2, 144, 1, 640])]; + tensor var_3484_end_mask_0 = const()[name = tensor("op_3484_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3484_cast_fp16 = slice_by_index(begin = var_3484_begin_0, end = var_3484_end_0, end_mask = var_3484_end_mask_0, x = transpose_21)[name = tensor("op_3484_cast_fp16")]; + tensor var_3488_begin_0 = const()[name = tensor("op_3488_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_3488_end_0 = const()[name = tensor("op_3488_end_0"), val = tensor([2, 144, 1, 704])]; + tensor var_3488_end_mask_0 = const()[name = tensor("op_3488_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3488_cast_fp16 = slice_by_index(begin = var_3488_begin_0, end = var_3488_end_0, end_mask = var_3488_end_mask_0, x = transpose_21)[name = tensor("op_3488_cast_fp16")]; + tensor var_3492_begin_0 = const()[name = tensor("op_3492_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_3492_end_0 = const()[name = tensor("op_3492_end_0"), val = tensor([2, 144, 1, 768])]; + tensor var_3492_end_mask_0 = const()[name = tensor("op_3492_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3492_cast_fp16 = slice_by_index(begin = var_3492_begin_0, end = var_3492_end_0, end_mask = var_3492_end_mask_0, x = transpose_21)[name = tensor("op_3492_cast_fp16")]; + tensor var_3496_begin_0 = const()[name = tensor("op_3496_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_3496_end_0 = const()[name = tensor("op_3496_end_0"), val = tensor([2, 144, 1, 832])]; + tensor var_3496_end_mask_0 = const()[name = tensor("op_3496_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3496_cast_fp16 = slice_by_index(begin = var_3496_begin_0, end = var_3496_end_0, end_mask = var_3496_end_mask_0, x = transpose_21)[name = tensor("op_3496_cast_fp16")]; + tensor var_3500_begin_0 = const()[name = tensor("op_3500_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_3500_end_0 = const()[name = tensor("op_3500_end_0"), val = tensor([2, 144, 1, 896])]; + tensor var_3500_end_mask_0 = const()[name = tensor("op_3500_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3500_cast_fp16 = slice_by_index(begin = var_3500_begin_0, end = var_3500_end_0, end_mask = var_3500_end_mask_0, x = transpose_21)[name = tensor("op_3500_cast_fp16")]; + tensor var_3504_begin_0 = const()[name = tensor("op_3504_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_3504_end_0 = const()[name = tensor("op_3504_end_0"), val = tensor([2, 144, 1, 960])]; + tensor var_3504_end_mask_0 = const()[name = tensor("op_3504_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3504_cast_fp16 = slice_by_index(begin = var_3504_begin_0, end = var_3504_end_0, end_mask = var_3504_end_mask_0, x = transpose_21)[name = tensor("op_3504_cast_fp16")]; + tensor var_3508_begin_0 = const()[name = tensor("op_3508_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_3508_end_0 = const()[name = tensor("op_3508_end_0"), val = tensor([2, 144, 1, 1024])]; + tensor var_3508_end_mask_0 = const()[name = tensor("op_3508_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3508_cast_fp16 = slice_by_index(begin = var_3508_begin_0, end = var_3508_end_0, end_mask = var_3508_end_mask_0, x = transpose_21)[name = tensor("op_3508_cast_fp16")]; + tensor var_3512_begin_0 = const()[name = tensor("op_3512_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_3512_end_0 = const()[name = tensor("op_3512_end_0"), val = tensor([2, 144, 1, 1088])]; + tensor var_3512_end_mask_0 = const()[name = tensor("op_3512_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3512_cast_fp16 = slice_by_index(begin = var_3512_begin_0, end = var_3512_end_0, end_mask = var_3512_end_mask_0, x = transpose_21)[name = tensor("op_3512_cast_fp16")]; + tensor var_3516_begin_0 = const()[name = tensor("op_3516_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_3516_end_0 = const()[name = tensor("op_3516_end_0"), val = tensor([2, 144, 1, 1152])]; + tensor var_3516_end_mask_0 = const()[name = tensor("op_3516_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3516_cast_fp16 = slice_by_index(begin = var_3516_begin_0, end = var_3516_end_0, end_mask = var_3516_end_mask_0, x = transpose_21)[name = tensor("op_3516_cast_fp16")]; + tensor var_3520_begin_0 = const()[name = tensor("op_3520_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_3520_end_0 = const()[name = tensor("op_3520_end_0"), val = tensor([2, 144, 1, 1216])]; + tensor var_3520_end_mask_0 = const()[name = tensor("op_3520_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3520_cast_fp16 = slice_by_index(begin = var_3520_begin_0, end = var_3520_end_0, end_mask = var_3520_end_mask_0, x = transpose_21)[name = tensor("op_3520_cast_fp16")]; + tensor var_3524_begin_0 = const()[name = tensor("op_3524_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_3524_end_0 = const()[name = tensor("op_3524_end_0"), val = tensor([2, 144, 1, 1280])]; + tensor var_3524_end_mask_0 = const()[name = tensor("op_3524_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3524_cast_fp16 = slice_by_index(begin = var_3524_begin_0, end = var_3524_end_0, end_mask = var_3524_end_mask_0, x = transpose_21)[name = tensor("op_3524_cast_fp16")]; + tensor var_3526_begin_0 = const()[name = tensor("op_3526_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_3526_end_0 = const()[name = tensor("op_3526_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_3526_end_mask_0 = const()[name = tensor("op_3526_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3526_cast_fp16 = slice_by_index(begin = var_3526_begin_0, end = var_3526_end_0, end_mask = var_3526_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3526_cast_fp16")]; + tensor var_3530_begin_0 = const()[name = tensor("op_3530_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_3530_end_0 = const()[name = tensor("op_3530_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_3530_end_mask_0 = const()[name = tensor("op_3530_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3530_cast_fp16 = slice_by_index(begin = var_3530_begin_0, end = var_3530_end_0, end_mask = var_3530_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3530_cast_fp16")]; + tensor var_3534_begin_0 = const()[name = tensor("op_3534_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_3534_end_0 = const()[name = tensor("op_3534_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_3534_end_mask_0 = const()[name = tensor("op_3534_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3534_cast_fp16 = slice_by_index(begin = var_3534_begin_0, end = var_3534_end_0, end_mask = var_3534_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3534_cast_fp16")]; + tensor var_3538_begin_0 = const()[name = tensor("op_3538_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_3538_end_0 = const()[name = tensor("op_3538_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_3538_end_mask_0 = const()[name = tensor("op_3538_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3538_cast_fp16 = slice_by_index(begin = var_3538_begin_0, end = var_3538_end_0, end_mask = var_3538_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3538_cast_fp16")]; + tensor var_3542_begin_0 = const()[name = tensor("op_3542_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_3542_end_0 = const()[name = tensor("op_3542_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_3542_end_mask_0 = const()[name = tensor("op_3542_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3542_cast_fp16 = slice_by_index(begin = var_3542_begin_0, end = var_3542_end_0, end_mask = var_3542_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3542_cast_fp16")]; + tensor var_3546_begin_0 = const()[name = tensor("op_3546_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_3546_end_0 = const()[name = tensor("op_3546_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_3546_end_mask_0 = const()[name = tensor("op_3546_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3546_cast_fp16 = slice_by_index(begin = var_3546_begin_0, end = var_3546_end_0, end_mask = var_3546_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3546_cast_fp16")]; + tensor var_3550_begin_0 = const()[name = tensor("op_3550_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_3550_end_0 = const()[name = tensor("op_3550_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_3550_end_mask_0 = const()[name = tensor("op_3550_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3550_cast_fp16 = slice_by_index(begin = var_3550_begin_0, end = var_3550_end_0, end_mask = var_3550_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3550_cast_fp16")]; + tensor var_3554_begin_0 = const()[name = tensor("op_3554_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_3554_end_0 = const()[name = tensor("op_3554_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_3554_end_mask_0 = const()[name = tensor("op_3554_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3554_cast_fp16 = slice_by_index(begin = var_3554_begin_0, end = var_3554_end_0, end_mask = var_3554_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3554_cast_fp16")]; + tensor var_3558_begin_0 = const()[name = tensor("op_3558_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_3558_end_0 = const()[name = tensor("op_3558_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_3558_end_mask_0 = const()[name = tensor("op_3558_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3558_cast_fp16 = slice_by_index(begin = var_3558_begin_0, end = var_3558_end_0, end_mask = var_3558_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3558_cast_fp16")]; + tensor var_3562_begin_0 = const()[name = tensor("op_3562_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_3562_end_0 = const()[name = tensor("op_3562_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_3562_end_mask_0 = const()[name = tensor("op_3562_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3562_cast_fp16 = slice_by_index(begin = var_3562_begin_0, end = var_3562_end_0, end_mask = var_3562_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3562_cast_fp16")]; + tensor var_3566_begin_0 = const()[name = tensor("op_3566_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_3566_end_0 = const()[name = tensor("op_3566_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_3566_end_mask_0 = const()[name = tensor("op_3566_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3566_cast_fp16 = slice_by_index(begin = var_3566_begin_0, end = var_3566_end_0, end_mask = var_3566_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3566_cast_fp16")]; + tensor var_3570_begin_0 = const()[name = tensor("op_3570_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_3570_end_0 = const()[name = tensor("op_3570_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_3570_end_mask_0 = const()[name = tensor("op_3570_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3570_cast_fp16 = slice_by_index(begin = var_3570_begin_0, end = var_3570_end_0, end_mask = var_3570_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3570_cast_fp16")]; + tensor var_3574_begin_0 = const()[name = tensor("op_3574_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_3574_end_0 = const()[name = tensor("op_3574_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_3574_end_mask_0 = const()[name = tensor("op_3574_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3574_cast_fp16 = slice_by_index(begin = var_3574_begin_0, end = var_3574_end_0, end_mask = var_3574_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3574_cast_fp16")]; + tensor var_3578_begin_0 = const()[name = tensor("op_3578_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_3578_end_0 = const()[name = tensor("op_3578_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_3578_end_mask_0 = const()[name = tensor("op_3578_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3578_cast_fp16 = slice_by_index(begin = var_3578_begin_0, end = var_3578_end_0, end_mask = var_3578_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3578_cast_fp16")]; + tensor var_3582_begin_0 = const()[name = tensor("op_3582_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_3582_end_0 = const()[name = tensor("op_3582_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_3582_end_mask_0 = const()[name = tensor("op_3582_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3582_cast_fp16 = slice_by_index(begin = var_3582_begin_0, end = var_3582_end_0, end_mask = var_3582_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3582_cast_fp16")]; + tensor var_3586_begin_0 = const()[name = tensor("op_3586_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_3586_end_0 = const()[name = tensor("op_3586_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_3586_end_mask_0 = const()[name = tensor("op_3586_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3586_cast_fp16 = slice_by_index(begin = var_3586_begin_0, end = var_3586_end_0, end_mask = var_3586_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3586_cast_fp16")]; + tensor var_3590_begin_0 = const()[name = tensor("op_3590_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_3590_end_0 = const()[name = tensor("op_3590_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_3590_end_mask_0 = const()[name = tensor("op_3590_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3590_cast_fp16 = slice_by_index(begin = var_3590_begin_0, end = var_3590_end_0, end_mask = var_3590_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3590_cast_fp16")]; + tensor var_3594_begin_0 = const()[name = tensor("op_3594_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_3594_end_0 = const()[name = tensor("op_3594_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_3594_end_mask_0 = const()[name = tensor("op_3594_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3594_cast_fp16 = slice_by_index(begin = var_3594_begin_0, end = var_3594_end_0, end_mask = var_3594_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3594_cast_fp16")]; + tensor var_3598_begin_0 = const()[name = tensor("op_3598_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_3598_end_0 = const()[name = tensor("op_3598_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_3598_end_mask_0 = const()[name = tensor("op_3598_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3598_cast_fp16 = slice_by_index(begin = var_3598_begin_0, end = var_3598_end_0, end_mask = var_3598_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3598_cast_fp16")]; + tensor var_3602_begin_0 = const()[name = tensor("op_3602_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_3602_end_0 = const()[name = tensor("op_3602_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_3602_end_mask_0 = const()[name = tensor("op_3602_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3602_cast_fp16 = slice_by_index(begin = var_3602_begin_0, end = var_3602_end_0, end_mask = var_3602_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3602_cast_fp16")]; + tensor var_3606_equation_0 = const()[name = tensor("op_3606_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3606_cast_fp16 = einsum(equation = var_3606_equation_0, values = (var_3448_cast_fp16, var_3365_cast_fp16))[name = tensor("op_3606_cast_fp16")]; + tensor var_3607_to_fp16 = const()[name = tensor("op_3607_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_201_cast_fp16 = mul(x = var_3606_cast_fp16, y = var_3607_to_fp16)[name = tensor("aw_201_cast_fp16")]; + tensor var_3610_equation_0 = const()[name = tensor("op_3610_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3610_cast_fp16 = einsum(equation = var_3610_equation_0, values = (var_3452_cast_fp16, var_3369_cast_fp16))[name = tensor("op_3610_cast_fp16")]; + tensor var_3611_to_fp16 = const()[name = tensor("op_3611_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_203_cast_fp16 = mul(x = var_3610_cast_fp16, y = var_3611_to_fp16)[name = tensor("aw_203_cast_fp16")]; + tensor var_3614_equation_0 = const()[name = tensor("op_3614_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3614_cast_fp16 = einsum(equation = var_3614_equation_0, values = (var_3456_cast_fp16, var_3373_cast_fp16))[name = tensor("op_3614_cast_fp16")]; + tensor var_3615_to_fp16 = const()[name = tensor("op_3615_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_205_cast_fp16 = mul(x = var_3614_cast_fp16, y = var_3615_to_fp16)[name = tensor("aw_205_cast_fp16")]; + tensor var_3618_equation_0 = const()[name = tensor("op_3618_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3618_cast_fp16 = einsum(equation = var_3618_equation_0, values = (var_3460_cast_fp16, var_3377_cast_fp16))[name = tensor("op_3618_cast_fp16")]; + tensor var_3619_to_fp16 = const()[name = tensor("op_3619_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_207_cast_fp16 = mul(x = var_3618_cast_fp16, y = var_3619_to_fp16)[name = tensor("aw_207_cast_fp16")]; + tensor var_3622_equation_0 = const()[name = tensor("op_3622_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3622_cast_fp16 = einsum(equation = var_3622_equation_0, values = (var_3464_cast_fp16, var_3381_cast_fp16))[name = tensor("op_3622_cast_fp16")]; + tensor var_3623_to_fp16 = const()[name = tensor("op_3623_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_209_cast_fp16 = mul(x = var_3622_cast_fp16, y = var_3623_to_fp16)[name = tensor("aw_209_cast_fp16")]; + tensor var_3626_equation_0 = const()[name = tensor("op_3626_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3626_cast_fp16 = einsum(equation = var_3626_equation_0, values = (var_3468_cast_fp16, var_3385_cast_fp16))[name = tensor("op_3626_cast_fp16")]; + tensor var_3627_to_fp16 = const()[name = tensor("op_3627_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_211_cast_fp16 = mul(x = var_3626_cast_fp16, y = var_3627_to_fp16)[name = tensor("aw_211_cast_fp16")]; + tensor var_3630_equation_0 = const()[name = tensor("op_3630_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3630_cast_fp16 = einsum(equation = var_3630_equation_0, values = (var_3472_cast_fp16, var_3389_cast_fp16))[name = tensor("op_3630_cast_fp16")]; + tensor var_3631_to_fp16 = const()[name = tensor("op_3631_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_213_cast_fp16 = mul(x = var_3630_cast_fp16, y = var_3631_to_fp16)[name = tensor("aw_213_cast_fp16")]; + tensor var_3634_equation_0 = const()[name = tensor("op_3634_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3634_cast_fp16 = einsum(equation = var_3634_equation_0, values = (var_3476_cast_fp16, var_3393_cast_fp16))[name = tensor("op_3634_cast_fp16")]; + tensor var_3635_to_fp16 = const()[name = tensor("op_3635_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_215_cast_fp16 = mul(x = var_3634_cast_fp16, y = var_3635_to_fp16)[name = tensor("aw_215_cast_fp16")]; + tensor var_3638_equation_0 = const()[name = tensor("op_3638_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3638_cast_fp16 = einsum(equation = var_3638_equation_0, values = (var_3480_cast_fp16, var_3397_cast_fp16))[name = tensor("op_3638_cast_fp16")]; + tensor var_3639_to_fp16 = const()[name = tensor("op_3639_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_217_cast_fp16 = mul(x = var_3638_cast_fp16, y = var_3639_to_fp16)[name = tensor("aw_217_cast_fp16")]; + tensor var_3642_equation_0 = const()[name = tensor("op_3642_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3642_cast_fp16 = einsum(equation = var_3642_equation_0, values = (var_3484_cast_fp16, var_3401_cast_fp16))[name = tensor("op_3642_cast_fp16")]; + tensor var_3643_to_fp16 = const()[name = tensor("op_3643_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_219_cast_fp16 = mul(x = var_3642_cast_fp16, y = var_3643_to_fp16)[name = tensor("aw_219_cast_fp16")]; + tensor var_3646_equation_0 = const()[name = tensor("op_3646_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3646_cast_fp16 = einsum(equation = var_3646_equation_0, values = (var_3488_cast_fp16, var_3405_cast_fp16))[name = tensor("op_3646_cast_fp16")]; + tensor var_3647_to_fp16 = const()[name = tensor("op_3647_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_221_cast_fp16 = mul(x = var_3646_cast_fp16, y = var_3647_to_fp16)[name = tensor("aw_221_cast_fp16")]; + tensor var_3650_equation_0 = const()[name = tensor("op_3650_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3650_cast_fp16 = einsum(equation = var_3650_equation_0, values = (var_3492_cast_fp16, var_3409_cast_fp16))[name = tensor("op_3650_cast_fp16")]; + tensor var_3651_to_fp16 = const()[name = tensor("op_3651_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_223_cast_fp16 = mul(x = var_3650_cast_fp16, y = var_3651_to_fp16)[name = tensor("aw_223_cast_fp16")]; + tensor var_3654_equation_0 = const()[name = tensor("op_3654_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3654_cast_fp16 = einsum(equation = var_3654_equation_0, values = (var_3496_cast_fp16, var_3413_cast_fp16))[name = tensor("op_3654_cast_fp16")]; + tensor var_3655_to_fp16 = const()[name = tensor("op_3655_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_225_cast_fp16 = mul(x = var_3654_cast_fp16, y = var_3655_to_fp16)[name = tensor("aw_225_cast_fp16")]; + tensor var_3658_equation_0 = const()[name = tensor("op_3658_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3658_cast_fp16 = einsum(equation = var_3658_equation_0, values = (var_3500_cast_fp16, var_3417_cast_fp16))[name = tensor("op_3658_cast_fp16")]; + tensor var_3659_to_fp16 = const()[name = tensor("op_3659_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_227_cast_fp16 = mul(x = var_3658_cast_fp16, y = var_3659_to_fp16)[name = tensor("aw_227_cast_fp16")]; + tensor var_3662_equation_0 = const()[name = tensor("op_3662_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3662_cast_fp16 = einsum(equation = var_3662_equation_0, values = (var_3504_cast_fp16, var_3421_cast_fp16))[name = tensor("op_3662_cast_fp16")]; + tensor var_3663_to_fp16 = const()[name = tensor("op_3663_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_229_cast_fp16 = mul(x = var_3662_cast_fp16, y = var_3663_to_fp16)[name = tensor("aw_229_cast_fp16")]; + tensor var_3666_equation_0 = const()[name = tensor("op_3666_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3666_cast_fp16 = einsum(equation = var_3666_equation_0, values = (var_3508_cast_fp16, var_3425_cast_fp16))[name = tensor("op_3666_cast_fp16")]; + tensor var_3667_to_fp16 = const()[name = tensor("op_3667_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_231_cast_fp16 = mul(x = var_3666_cast_fp16, y = var_3667_to_fp16)[name = tensor("aw_231_cast_fp16")]; + tensor var_3670_equation_0 = const()[name = tensor("op_3670_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3670_cast_fp16 = einsum(equation = var_3670_equation_0, values = (var_3512_cast_fp16, var_3429_cast_fp16))[name = tensor("op_3670_cast_fp16")]; + tensor var_3671_to_fp16 = const()[name = tensor("op_3671_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_233_cast_fp16 = mul(x = var_3670_cast_fp16, y = var_3671_to_fp16)[name = tensor("aw_233_cast_fp16")]; + tensor var_3674_equation_0 = const()[name = tensor("op_3674_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3674_cast_fp16 = einsum(equation = var_3674_equation_0, values = (var_3516_cast_fp16, var_3433_cast_fp16))[name = tensor("op_3674_cast_fp16")]; + tensor var_3675_to_fp16 = const()[name = tensor("op_3675_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_235_cast_fp16 = mul(x = var_3674_cast_fp16, y = var_3675_to_fp16)[name = tensor("aw_235_cast_fp16")]; + tensor var_3678_equation_0 = const()[name = tensor("op_3678_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3678_cast_fp16 = einsum(equation = var_3678_equation_0, values = (var_3520_cast_fp16, var_3437_cast_fp16))[name = tensor("op_3678_cast_fp16")]; + tensor var_3679_to_fp16 = const()[name = tensor("op_3679_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_237_cast_fp16 = mul(x = var_3678_cast_fp16, y = var_3679_to_fp16)[name = tensor("aw_237_cast_fp16")]; + tensor var_3682_equation_0 = const()[name = tensor("op_3682_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_3682_cast_fp16 = einsum(equation = var_3682_equation_0, values = (var_3524_cast_fp16, var_3441_cast_fp16))[name = tensor("op_3682_cast_fp16")]; + tensor var_3683_to_fp16 = const()[name = tensor("op_3683_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_239_cast_fp16 = mul(x = var_3682_cast_fp16, y = var_3683_to_fp16)[name = tensor("aw_239_cast_fp16")]; + tensor var_3685_cast_fp16 = softmax(axis = var_2254, x = aw_201_cast_fp16)[name = tensor("op_3685_cast_fp16")]; + tensor var_3686_cast_fp16 = softmax(axis = var_2254, x = aw_203_cast_fp16)[name = tensor("op_3686_cast_fp16")]; + tensor var_3687_cast_fp16 = softmax(axis = var_2254, x = aw_205_cast_fp16)[name = tensor("op_3687_cast_fp16")]; + tensor var_3688_cast_fp16 = softmax(axis = var_2254, x = aw_207_cast_fp16)[name = tensor("op_3688_cast_fp16")]; + tensor var_3689_cast_fp16 = softmax(axis = var_2254, x = aw_209_cast_fp16)[name = tensor("op_3689_cast_fp16")]; + tensor var_3690_cast_fp16 = softmax(axis = var_2254, x = aw_211_cast_fp16)[name = tensor("op_3690_cast_fp16")]; + tensor var_3691_cast_fp16 = softmax(axis = var_2254, x = aw_213_cast_fp16)[name = tensor("op_3691_cast_fp16")]; + tensor var_3692_cast_fp16 = softmax(axis = var_2254, x = aw_215_cast_fp16)[name = tensor("op_3692_cast_fp16")]; + tensor var_3693_cast_fp16 = softmax(axis = var_2254, x = aw_217_cast_fp16)[name = tensor("op_3693_cast_fp16")]; + tensor var_3694_cast_fp16 = softmax(axis = var_2254, x = aw_219_cast_fp16)[name = tensor("op_3694_cast_fp16")]; + tensor var_3695_cast_fp16 = softmax(axis = var_2254, x = aw_221_cast_fp16)[name = tensor("op_3695_cast_fp16")]; + tensor var_3696_cast_fp16 = softmax(axis = var_2254, x = aw_223_cast_fp16)[name = tensor("op_3696_cast_fp16")]; + tensor var_3697_cast_fp16 = softmax(axis = var_2254, x = aw_225_cast_fp16)[name = tensor("op_3697_cast_fp16")]; + tensor var_3698_cast_fp16 = softmax(axis = var_2254, x = aw_227_cast_fp16)[name = tensor("op_3698_cast_fp16")]; + tensor var_3699_cast_fp16 = softmax(axis = var_2254, x = aw_229_cast_fp16)[name = tensor("op_3699_cast_fp16")]; + tensor var_3700_cast_fp16 = softmax(axis = var_2254, x = aw_231_cast_fp16)[name = tensor("op_3700_cast_fp16")]; + tensor var_3701_cast_fp16 = softmax(axis = var_2254, x = aw_233_cast_fp16)[name = tensor("op_3701_cast_fp16")]; + tensor var_3702_cast_fp16 = softmax(axis = var_2254, x = aw_235_cast_fp16)[name = tensor("op_3702_cast_fp16")]; + tensor var_3703_cast_fp16 = softmax(axis = var_2254, x = aw_237_cast_fp16)[name = tensor("op_3703_cast_fp16")]; + tensor var_3704_cast_fp16 = softmax(axis = var_2254, x = aw_239_cast_fp16)[name = tensor("op_3704_cast_fp16")]; + tensor var_3706_equation_0 = const()[name = tensor("op_3706_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3706_cast_fp16 = einsum(equation = var_3706_equation_0, values = (var_3526_cast_fp16, var_3685_cast_fp16))[name = tensor("op_3706_cast_fp16")]; + tensor var_3708_equation_0 = const()[name = tensor("op_3708_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3708_cast_fp16 = einsum(equation = var_3708_equation_0, values = (var_3530_cast_fp16, var_3686_cast_fp16))[name = tensor("op_3708_cast_fp16")]; + tensor var_3710_equation_0 = const()[name = tensor("op_3710_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3710_cast_fp16 = einsum(equation = var_3710_equation_0, values = (var_3534_cast_fp16, var_3687_cast_fp16))[name = tensor("op_3710_cast_fp16")]; + tensor var_3712_equation_0 = const()[name = tensor("op_3712_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3712_cast_fp16 = einsum(equation = var_3712_equation_0, values = (var_3538_cast_fp16, var_3688_cast_fp16))[name = tensor("op_3712_cast_fp16")]; + tensor var_3714_equation_0 = const()[name = tensor("op_3714_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3714_cast_fp16 = einsum(equation = var_3714_equation_0, values = (var_3542_cast_fp16, var_3689_cast_fp16))[name = tensor("op_3714_cast_fp16")]; + tensor var_3716_equation_0 = const()[name = tensor("op_3716_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3716_cast_fp16 = einsum(equation = var_3716_equation_0, values = (var_3546_cast_fp16, var_3690_cast_fp16))[name = tensor("op_3716_cast_fp16")]; + tensor var_3718_equation_0 = const()[name = tensor("op_3718_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3718_cast_fp16 = einsum(equation = var_3718_equation_0, values = (var_3550_cast_fp16, var_3691_cast_fp16))[name = tensor("op_3718_cast_fp16")]; + tensor var_3720_equation_0 = const()[name = tensor("op_3720_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3720_cast_fp16 = einsum(equation = var_3720_equation_0, values = (var_3554_cast_fp16, var_3692_cast_fp16))[name = tensor("op_3720_cast_fp16")]; + tensor var_3722_equation_0 = const()[name = tensor("op_3722_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3722_cast_fp16 = einsum(equation = var_3722_equation_0, values = (var_3558_cast_fp16, var_3693_cast_fp16))[name = tensor("op_3722_cast_fp16")]; + tensor var_3724_equation_0 = const()[name = tensor("op_3724_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3724_cast_fp16 = einsum(equation = var_3724_equation_0, values = (var_3562_cast_fp16, var_3694_cast_fp16))[name = tensor("op_3724_cast_fp16")]; + tensor var_3726_equation_0 = const()[name = tensor("op_3726_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3726_cast_fp16 = einsum(equation = var_3726_equation_0, values = (var_3566_cast_fp16, var_3695_cast_fp16))[name = tensor("op_3726_cast_fp16")]; + tensor var_3728_equation_0 = const()[name = tensor("op_3728_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3728_cast_fp16 = einsum(equation = var_3728_equation_0, values = (var_3570_cast_fp16, var_3696_cast_fp16))[name = tensor("op_3728_cast_fp16")]; + tensor var_3730_equation_0 = const()[name = tensor("op_3730_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3730_cast_fp16 = einsum(equation = var_3730_equation_0, values = (var_3574_cast_fp16, var_3697_cast_fp16))[name = tensor("op_3730_cast_fp16")]; + tensor var_3732_equation_0 = const()[name = tensor("op_3732_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3732_cast_fp16 = einsum(equation = var_3732_equation_0, values = (var_3578_cast_fp16, var_3698_cast_fp16))[name = tensor("op_3732_cast_fp16")]; + tensor var_3734_equation_0 = const()[name = tensor("op_3734_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3734_cast_fp16 = einsum(equation = var_3734_equation_0, values = (var_3582_cast_fp16, var_3699_cast_fp16))[name = tensor("op_3734_cast_fp16")]; + tensor var_3736_equation_0 = const()[name = tensor("op_3736_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3736_cast_fp16 = einsum(equation = var_3736_equation_0, values = (var_3586_cast_fp16, var_3700_cast_fp16))[name = tensor("op_3736_cast_fp16")]; + tensor var_3738_equation_0 = const()[name = tensor("op_3738_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3738_cast_fp16 = einsum(equation = var_3738_equation_0, values = (var_3590_cast_fp16, var_3701_cast_fp16))[name = tensor("op_3738_cast_fp16")]; + tensor var_3740_equation_0 = const()[name = tensor("op_3740_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3740_cast_fp16 = einsum(equation = var_3740_equation_0, values = (var_3594_cast_fp16, var_3702_cast_fp16))[name = tensor("op_3740_cast_fp16")]; + tensor var_3742_equation_0 = const()[name = tensor("op_3742_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3742_cast_fp16 = einsum(equation = var_3742_equation_0, values = (var_3598_cast_fp16, var_3703_cast_fp16))[name = tensor("op_3742_cast_fp16")]; + tensor var_3744_equation_0 = const()[name = tensor("op_3744_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_3744_cast_fp16 = einsum(equation = var_3744_equation_0, values = (var_3602_cast_fp16, var_3704_cast_fp16))[name = tensor("op_3744_cast_fp16")]; + tensor input_159_interleave_0 = const()[name = tensor("input_159_interleave_0"), val = tensor(false)]; + tensor input_159_cast_fp16 = concat(axis = var_2254, interleave = input_159_interleave_0, values = (var_3706_cast_fp16, var_3708_cast_fp16, var_3710_cast_fp16, var_3712_cast_fp16, var_3714_cast_fp16, var_3716_cast_fp16, var_3718_cast_fp16, var_3720_cast_fp16, var_3722_cast_fp16, var_3724_cast_fp16, var_3726_cast_fp16, var_3728_cast_fp16, var_3730_cast_fp16, var_3732_cast_fp16, var_3734_cast_fp16, var_3736_cast_fp16, var_3738_cast_fp16, var_3740_cast_fp16, var_3742_cast_fp16, var_3744_cast_fp16))[name = tensor("input_159_cast_fp16")]; + tensor var_3750 = const()[name = tensor("op_3750"), val = tensor([1, 1])]; + tensor var_3752 = const()[name = tensor("op_3752"), val = tensor([1, 1])]; + tensor var_3754_pad_type_0 = const()[name = tensor("op_3754_pad_type_0"), val = tensor("custom")]; + tensor var_3754_pad_0 = const()[name = tensor("op_3754_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296200064)))]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299476928)))]; + tensor var_3754_cast_fp16 = conv(bias = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_3752, groups = var_2254, pad = var_3754_pad_0, pad_type = var_3754_pad_type_0, strides = var_3750, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_159_cast_fp16)[name = tensor("op_3754_cast_fp16")]; + tensor inputs_33_cast_fp16 = add(x = var_3754_cast_fp16, y = inputs_31_cast_fp16)[name = tensor("inputs_33_cast_fp16")]; + tensor var_3758 = const()[name = tensor("op_3758"), val = tensor([1])]; + tensor channels_mean_33_cast_fp16 = reduce_mean(axes = var_3758, keep_dims = var_2249, x = inputs_33_cast_fp16)[name = tensor("channels_mean_33_cast_fp16")]; + tensor zero_mean_33_cast_fp16 = sub(x = inputs_33_cast_fp16, y = channels_mean_33_cast_fp16)[name = tensor("zero_mean_33_cast_fp16")]; + tensor zero_mean_sq_33_cast_fp16 = mul(x = zero_mean_33_cast_fp16, y = zero_mean_33_cast_fp16)[name = tensor("zero_mean_sq_33_cast_fp16")]; + tensor var_3762 = const()[name = tensor("op_3762"), val = tensor([1])]; + tensor var_3763_cast_fp16 = reduce_mean(axes = var_3762, keep_dims = var_2249, x = zero_mean_sq_33_cast_fp16)[name = tensor("op_3763_cast_fp16")]; + tensor var_3764_to_fp16 = const()[name = tensor("op_3764_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_3765_cast_fp16 = add(x = var_3763_cast_fp16, y = var_3764_to_fp16)[name = tensor("op_3765_cast_fp16")]; + tensor denom_33_epsilon_0_to_fp16 = const()[name = tensor("denom_33_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_33_cast_fp16 = rsqrt(epsilon = denom_33_epsilon_0_to_fp16, x = var_3765_cast_fp16)[name = tensor("denom_33_cast_fp16")]; + tensor out_33_cast_fp16 = mul(x = zero_mean_33_cast_fp16, y = denom_33_cast_fp16)[name = tensor("out_33_cast_fp16")]; + tensor var_3769_to_fp16 = const()[name = tensor("op_3769_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299479552)))]; + tensor var_3770_cast_fp16 = add(x = out_33_cast_fp16, y = var_3769_to_fp16)[name = tensor("op_3770_cast_fp16")]; + tensor var_3772_to_fp16 = const()[name = tensor("op_3772_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299482176)))]; + tensor hidden_states_101_cast_fp16 = mul(x = var_3770_cast_fp16, y = var_3772_to_fp16)[name = tensor("hidden_states_101_cast_fp16")]; + tensor var_3779 = const()[name = tensor("op_3779"), val = tensor([1, 1])]; + tensor var_3781 = const()[name = tensor("op_3781"), val = tensor([1, 1])]; + tensor q_23_pad_type_0 = const()[name = tensor("q_23_pad_type_0"), val = tensor("custom")]; + tensor q_23_pad_0 = const()[name = tensor("q_23_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299484800)))]; + tensor q_23_cast_fp16 = conv(dilations = var_3781, groups = var_2254, pad = q_23_pad_0, pad_type = q_23_pad_type_0, strides = var_3779, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_101_cast_fp16)[name = tensor("q_23_cast_fp16")]; + tensor var_3785 = const()[name = tensor("op_3785"), val = tensor([1, 1])]; + tensor var_3787 = const()[name = tensor("op_3787"), val = tensor([1, 1])]; + tensor k_45_pad_type_0 = const()[name = tensor("k_45_pad_type_0"), val = tensor("custom")]; + tensor k_45_pad_0 = const()[name = tensor("k_45_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302761664)))]; + tensor k_45_cast_fp16 = conv(dilations = var_3787, groups = var_2254, pad = k_45_pad_0, pad_type = k_45_pad_type_0, strides = var_3785, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_45_cast_fp16")]; + tensor var_3791 = const()[name = tensor("op_3791"), val = tensor([1, 1])]; + tensor var_3793 = const()[name = tensor("op_3793"), val = tensor([1, 1])]; + tensor v_23_pad_type_0 = const()[name = tensor("v_23_pad_type_0"), val = tensor("custom")]; + tensor v_23_pad_0 = const()[name = tensor("v_23_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(305383168)))]; + tensor v_23_cast_fp16 = conv(dilations = var_3793, groups = var_2254, pad = v_23_pad_0, pad_type = v_23_pad_type_0, strides = var_3791, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_23_cast_fp16")]; + tensor var_3797_begin_0 = const()[name = tensor("op_3797_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_3797_end_0 = const()[name = tensor("op_3797_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_3797_end_mask_0 = const()[name = tensor("op_3797_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3797_cast_fp16 = slice_by_index(begin = var_3797_begin_0, end = var_3797_end_0, end_mask = var_3797_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3797_cast_fp16")]; + tensor var_3801_begin_0 = const()[name = tensor("op_3801_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_3801_end_0 = const()[name = tensor("op_3801_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_3801_end_mask_0 = const()[name = tensor("op_3801_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3801_cast_fp16 = slice_by_index(begin = var_3801_begin_0, end = var_3801_end_0, end_mask = var_3801_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3801_cast_fp16")]; + tensor var_3805_begin_0 = const()[name = tensor("op_3805_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_3805_end_0 = const()[name = tensor("op_3805_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_3805_end_mask_0 = const()[name = tensor("op_3805_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3805_cast_fp16 = slice_by_index(begin = var_3805_begin_0, end = var_3805_end_0, end_mask = var_3805_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3805_cast_fp16")]; + tensor var_3809_begin_0 = const()[name = tensor("op_3809_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_3809_end_0 = const()[name = tensor("op_3809_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_3809_end_mask_0 = const()[name = tensor("op_3809_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3809_cast_fp16 = slice_by_index(begin = var_3809_begin_0, end = var_3809_end_0, end_mask = var_3809_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3809_cast_fp16")]; + tensor var_3813_begin_0 = const()[name = tensor("op_3813_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_3813_end_0 = const()[name = tensor("op_3813_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_3813_end_mask_0 = const()[name = tensor("op_3813_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3813_cast_fp16 = slice_by_index(begin = var_3813_begin_0, end = var_3813_end_0, end_mask = var_3813_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3813_cast_fp16")]; + tensor var_3817_begin_0 = const()[name = tensor("op_3817_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_3817_end_0 = const()[name = tensor("op_3817_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_3817_end_mask_0 = const()[name = tensor("op_3817_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3817_cast_fp16 = slice_by_index(begin = var_3817_begin_0, end = var_3817_end_0, end_mask = var_3817_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3817_cast_fp16")]; + tensor var_3821_begin_0 = const()[name = tensor("op_3821_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_3821_end_0 = const()[name = tensor("op_3821_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_3821_end_mask_0 = const()[name = tensor("op_3821_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3821_cast_fp16 = slice_by_index(begin = var_3821_begin_0, end = var_3821_end_0, end_mask = var_3821_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3821_cast_fp16")]; + tensor var_3825_begin_0 = const()[name = tensor("op_3825_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_3825_end_0 = const()[name = tensor("op_3825_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_3825_end_mask_0 = const()[name = tensor("op_3825_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3825_cast_fp16 = slice_by_index(begin = var_3825_begin_0, end = var_3825_end_0, end_mask = var_3825_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3825_cast_fp16")]; + tensor var_3829_begin_0 = const()[name = tensor("op_3829_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_3829_end_0 = const()[name = tensor("op_3829_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_3829_end_mask_0 = const()[name = tensor("op_3829_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3829_cast_fp16 = slice_by_index(begin = var_3829_begin_0, end = var_3829_end_0, end_mask = var_3829_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3829_cast_fp16")]; + tensor var_3833_begin_0 = const()[name = tensor("op_3833_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_3833_end_0 = const()[name = tensor("op_3833_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_3833_end_mask_0 = const()[name = tensor("op_3833_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3833_cast_fp16 = slice_by_index(begin = var_3833_begin_0, end = var_3833_end_0, end_mask = var_3833_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3833_cast_fp16")]; + tensor var_3837_begin_0 = const()[name = tensor("op_3837_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_3837_end_0 = const()[name = tensor("op_3837_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_3837_end_mask_0 = const()[name = tensor("op_3837_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3837_cast_fp16 = slice_by_index(begin = var_3837_begin_0, end = var_3837_end_0, end_mask = var_3837_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3837_cast_fp16")]; + tensor var_3841_begin_0 = const()[name = tensor("op_3841_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_3841_end_0 = const()[name = tensor("op_3841_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_3841_end_mask_0 = const()[name = tensor("op_3841_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3841_cast_fp16 = slice_by_index(begin = var_3841_begin_0, end = var_3841_end_0, end_mask = var_3841_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3841_cast_fp16")]; + tensor var_3845_begin_0 = const()[name = tensor("op_3845_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_3845_end_0 = const()[name = tensor("op_3845_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_3845_end_mask_0 = const()[name = tensor("op_3845_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3845_cast_fp16 = slice_by_index(begin = var_3845_begin_0, end = var_3845_end_0, end_mask = var_3845_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3845_cast_fp16")]; + tensor var_3849_begin_0 = const()[name = tensor("op_3849_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_3849_end_0 = const()[name = tensor("op_3849_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_3849_end_mask_0 = const()[name = tensor("op_3849_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3849_cast_fp16 = slice_by_index(begin = var_3849_begin_0, end = var_3849_end_0, end_mask = var_3849_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3849_cast_fp16")]; + tensor var_3853_begin_0 = const()[name = tensor("op_3853_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_3853_end_0 = const()[name = tensor("op_3853_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_3853_end_mask_0 = const()[name = tensor("op_3853_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3853_cast_fp16 = slice_by_index(begin = var_3853_begin_0, end = var_3853_end_0, end_mask = var_3853_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3853_cast_fp16")]; + tensor var_3857_begin_0 = const()[name = tensor("op_3857_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_3857_end_0 = const()[name = tensor("op_3857_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_3857_end_mask_0 = const()[name = tensor("op_3857_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3857_cast_fp16 = slice_by_index(begin = var_3857_begin_0, end = var_3857_end_0, end_mask = var_3857_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3857_cast_fp16")]; + tensor var_3861_begin_0 = const()[name = tensor("op_3861_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_3861_end_0 = const()[name = tensor("op_3861_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_3861_end_mask_0 = const()[name = tensor("op_3861_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3861_cast_fp16 = slice_by_index(begin = var_3861_begin_0, end = var_3861_end_0, end_mask = var_3861_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3861_cast_fp16")]; + tensor var_3865_begin_0 = const()[name = tensor("op_3865_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_3865_end_0 = const()[name = tensor("op_3865_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_3865_end_mask_0 = const()[name = tensor("op_3865_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3865_cast_fp16 = slice_by_index(begin = var_3865_begin_0, end = var_3865_end_0, end_mask = var_3865_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3865_cast_fp16")]; + tensor var_3869_begin_0 = const()[name = tensor("op_3869_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_3869_end_0 = const()[name = tensor("op_3869_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_3869_end_mask_0 = const()[name = tensor("op_3869_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3869_cast_fp16 = slice_by_index(begin = var_3869_begin_0, end = var_3869_end_0, end_mask = var_3869_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3869_cast_fp16")]; + tensor var_3873_begin_0 = const()[name = tensor("op_3873_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_3873_end_0 = const()[name = tensor("op_3873_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_3873_end_mask_0 = const()[name = tensor("op_3873_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3873_cast_fp16 = slice_by_index(begin = var_3873_begin_0, end = var_3873_end_0, end_mask = var_3873_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3873_cast_fp16")]; + tensor k_47_perm_0 = const()[name = tensor("k_47_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_3880_begin_0 = const()[name = tensor("op_3880_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_3880_end_0 = const()[name = tensor("op_3880_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_3880_end_mask_0 = const()[name = tensor("op_3880_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_20 = transpose(perm = k_47_perm_0, x = k_45_cast_fp16)[name = tensor("transpose_20")]; + tensor var_3880_cast_fp16 = slice_by_index(begin = var_3880_begin_0, end = var_3880_end_0, end_mask = var_3880_end_mask_0, x = transpose_20)[name = tensor("op_3880_cast_fp16")]; + tensor var_3884_begin_0 = const()[name = tensor("op_3884_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_3884_end_0 = const()[name = tensor("op_3884_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_3884_end_mask_0 = const()[name = tensor("op_3884_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3884_cast_fp16 = slice_by_index(begin = var_3884_begin_0, end = var_3884_end_0, end_mask = var_3884_end_mask_0, x = transpose_20)[name = tensor("op_3884_cast_fp16")]; + tensor var_3888_begin_0 = const()[name = tensor("op_3888_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_3888_end_0 = const()[name = tensor("op_3888_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_3888_end_mask_0 = const()[name = tensor("op_3888_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3888_cast_fp16 = slice_by_index(begin = var_3888_begin_0, end = var_3888_end_0, end_mask = var_3888_end_mask_0, x = transpose_20)[name = tensor("op_3888_cast_fp16")]; + tensor var_3892_begin_0 = const()[name = tensor("op_3892_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_3892_end_0 = const()[name = tensor("op_3892_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_3892_end_mask_0 = const()[name = tensor("op_3892_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3892_cast_fp16 = slice_by_index(begin = var_3892_begin_0, end = var_3892_end_0, end_mask = var_3892_end_mask_0, x = transpose_20)[name = tensor("op_3892_cast_fp16")]; + tensor var_3896_begin_0 = const()[name = tensor("op_3896_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_3896_end_0 = const()[name = tensor("op_3896_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_3896_end_mask_0 = const()[name = tensor("op_3896_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3896_cast_fp16 = slice_by_index(begin = var_3896_begin_0, end = var_3896_end_0, end_mask = var_3896_end_mask_0, x = transpose_20)[name = tensor("op_3896_cast_fp16")]; + tensor var_3900_begin_0 = const()[name = tensor("op_3900_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_3900_end_0 = const()[name = tensor("op_3900_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_3900_end_mask_0 = const()[name = tensor("op_3900_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3900_cast_fp16 = slice_by_index(begin = var_3900_begin_0, end = var_3900_end_0, end_mask = var_3900_end_mask_0, x = transpose_20)[name = tensor("op_3900_cast_fp16")]; + tensor var_3904_begin_0 = const()[name = tensor("op_3904_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_3904_end_0 = const()[name = tensor("op_3904_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_3904_end_mask_0 = const()[name = tensor("op_3904_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3904_cast_fp16 = slice_by_index(begin = var_3904_begin_0, end = var_3904_end_0, end_mask = var_3904_end_mask_0, x = transpose_20)[name = tensor("op_3904_cast_fp16")]; + tensor var_3908_begin_0 = const()[name = tensor("op_3908_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_3908_end_0 = const()[name = tensor("op_3908_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_3908_end_mask_0 = const()[name = tensor("op_3908_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3908_cast_fp16 = slice_by_index(begin = var_3908_begin_0, end = var_3908_end_0, end_mask = var_3908_end_mask_0, x = transpose_20)[name = tensor("op_3908_cast_fp16")]; + tensor var_3912_begin_0 = const()[name = tensor("op_3912_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_3912_end_0 = const()[name = tensor("op_3912_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_3912_end_mask_0 = const()[name = tensor("op_3912_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3912_cast_fp16 = slice_by_index(begin = var_3912_begin_0, end = var_3912_end_0, end_mask = var_3912_end_mask_0, x = transpose_20)[name = tensor("op_3912_cast_fp16")]; + tensor var_3916_begin_0 = const()[name = tensor("op_3916_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_3916_end_0 = const()[name = tensor("op_3916_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_3916_end_mask_0 = const()[name = tensor("op_3916_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3916_cast_fp16 = slice_by_index(begin = var_3916_begin_0, end = var_3916_end_0, end_mask = var_3916_end_mask_0, x = transpose_20)[name = tensor("op_3916_cast_fp16")]; + tensor var_3920_begin_0 = const()[name = tensor("op_3920_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_3920_end_0 = const()[name = tensor("op_3920_end_0"), val = tensor([2, 77, 1, 704])]; + tensor var_3920_end_mask_0 = const()[name = tensor("op_3920_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3920_cast_fp16 = slice_by_index(begin = var_3920_begin_0, end = var_3920_end_0, end_mask = var_3920_end_mask_0, x = transpose_20)[name = tensor("op_3920_cast_fp16")]; + tensor var_3924_begin_0 = const()[name = tensor("op_3924_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_3924_end_0 = const()[name = tensor("op_3924_end_0"), val = tensor([2, 77, 1, 768])]; + tensor var_3924_end_mask_0 = const()[name = tensor("op_3924_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3924_cast_fp16 = slice_by_index(begin = var_3924_begin_0, end = var_3924_end_0, end_mask = var_3924_end_mask_0, x = transpose_20)[name = tensor("op_3924_cast_fp16")]; + tensor var_3928_begin_0 = const()[name = tensor("op_3928_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_3928_end_0 = const()[name = tensor("op_3928_end_0"), val = tensor([2, 77, 1, 832])]; + tensor var_3928_end_mask_0 = const()[name = tensor("op_3928_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3928_cast_fp16 = slice_by_index(begin = var_3928_begin_0, end = var_3928_end_0, end_mask = var_3928_end_mask_0, x = transpose_20)[name = tensor("op_3928_cast_fp16")]; + tensor var_3932_begin_0 = const()[name = tensor("op_3932_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_3932_end_0 = const()[name = tensor("op_3932_end_0"), val = tensor([2, 77, 1, 896])]; + tensor var_3932_end_mask_0 = const()[name = tensor("op_3932_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3932_cast_fp16 = slice_by_index(begin = var_3932_begin_0, end = var_3932_end_0, end_mask = var_3932_end_mask_0, x = transpose_20)[name = tensor("op_3932_cast_fp16")]; + tensor var_3936_begin_0 = const()[name = tensor("op_3936_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_3936_end_0 = const()[name = tensor("op_3936_end_0"), val = tensor([2, 77, 1, 960])]; + tensor var_3936_end_mask_0 = const()[name = tensor("op_3936_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3936_cast_fp16 = slice_by_index(begin = var_3936_begin_0, end = var_3936_end_0, end_mask = var_3936_end_mask_0, x = transpose_20)[name = tensor("op_3936_cast_fp16")]; + tensor var_3940_begin_0 = const()[name = tensor("op_3940_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_3940_end_0 = const()[name = tensor("op_3940_end_0"), val = tensor([2, 77, 1, 1024])]; + tensor var_3940_end_mask_0 = const()[name = tensor("op_3940_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3940_cast_fp16 = slice_by_index(begin = var_3940_begin_0, end = var_3940_end_0, end_mask = var_3940_end_mask_0, x = transpose_20)[name = tensor("op_3940_cast_fp16")]; + tensor var_3944_begin_0 = const()[name = tensor("op_3944_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_3944_end_0 = const()[name = tensor("op_3944_end_0"), val = tensor([2, 77, 1, 1088])]; + tensor var_3944_end_mask_0 = const()[name = tensor("op_3944_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3944_cast_fp16 = slice_by_index(begin = var_3944_begin_0, end = var_3944_end_0, end_mask = var_3944_end_mask_0, x = transpose_20)[name = tensor("op_3944_cast_fp16")]; + tensor var_3948_begin_0 = const()[name = tensor("op_3948_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_3948_end_0 = const()[name = tensor("op_3948_end_0"), val = tensor([2, 77, 1, 1152])]; + tensor var_3948_end_mask_0 = const()[name = tensor("op_3948_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3948_cast_fp16 = slice_by_index(begin = var_3948_begin_0, end = var_3948_end_0, end_mask = var_3948_end_mask_0, x = transpose_20)[name = tensor("op_3948_cast_fp16")]; + tensor var_3952_begin_0 = const()[name = tensor("op_3952_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_3952_end_0 = const()[name = tensor("op_3952_end_0"), val = tensor([2, 77, 1, 1216])]; + tensor var_3952_end_mask_0 = const()[name = tensor("op_3952_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3952_cast_fp16 = slice_by_index(begin = var_3952_begin_0, end = var_3952_end_0, end_mask = var_3952_end_mask_0, x = transpose_20)[name = tensor("op_3952_cast_fp16")]; + tensor var_3956_begin_0 = const()[name = tensor("op_3956_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_3956_end_0 = const()[name = tensor("op_3956_end_0"), val = tensor([2, 77, 1, 1280])]; + tensor var_3956_end_mask_0 = const()[name = tensor("op_3956_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_3956_cast_fp16 = slice_by_index(begin = var_3956_begin_0, end = var_3956_end_0, end_mask = var_3956_end_mask_0, x = transpose_20)[name = tensor("op_3956_cast_fp16")]; + tensor var_3958_begin_0 = const()[name = tensor("op_3958_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_3958_end_0 = const()[name = tensor("op_3958_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_3958_end_mask_0 = const()[name = tensor("op_3958_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3958_cast_fp16 = slice_by_index(begin = var_3958_begin_0, end = var_3958_end_0, end_mask = var_3958_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3958_cast_fp16")]; + tensor var_3962_begin_0 = const()[name = tensor("op_3962_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_3962_end_0 = const()[name = tensor("op_3962_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_3962_end_mask_0 = const()[name = tensor("op_3962_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3962_cast_fp16 = slice_by_index(begin = var_3962_begin_0, end = var_3962_end_0, end_mask = var_3962_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3962_cast_fp16")]; + tensor var_3966_begin_0 = const()[name = tensor("op_3966_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_3966_end_0 = const()[name = tensor("op_3966_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_3966_end_mask_0 = const()[name = tensor("op_3966_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3966_cast_fp16 = slice_by_index(begin = var_3966_begin_0, end = var_3966_end_0, end_mask = var_3966_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3966_cast_fp16")]; + tensor var_3970_begin_0 = const()[name = tensor("op_3970_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_3970_end_0 = const()[name = tensor("op_3970_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_3970_end_mask_0 = const()[name = tensor("op_3970_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3970_cast_fp16 = slice_by_index(begin = var_3970_begin_0, end = var_3970_end_0, end_mask = var_3970_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3970_cast_fp16")]; + tensor var_3974_begin_0 = const()[name = tensor("op_3974_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_3974_end_0 = const()[name = tensor("op_3974_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_3974_end_mask_0 = const()[name = tensor("op_3974_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3974_cast_fp16 = slice_by_index(begin = var_3974_begin_0, end = var_3974_end_0, end_mask = var_3974_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3974_cast_fp16")]; + tensor var_3978_begin_0 = const()[name = tensor("op_3978_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_3978_end_0 = const()[name = tensor("op_3978_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_3978_end_mask_0 = const()[name = tensor("op_3978_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3978_cast_fp16 = slice_by_index(begin = var_3978_begin_0, end = var_3978_end_0, end_mask = var_3978_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3978_cast_fp16")]; + tensor var_3982_begin_0 = const()[name = tensor("op_3982_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_3982_end_0 = const()[name = tensor("op_3982_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_3982_end_mask_0 = const()[name = tensor("op_3982_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3982_cast_fp16 = slice_by_index(begin = var_3982_begin_0, end = var_3982_end_0, end_mask = var_3982_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3982_cast_fp16")]; + tensor var_3986_begin_0 = const()[name = tensor("op_3986_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_3986_end_0 = const()[name = tensor("op_3986_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_3986_end_mask_0 = const()[name = tensor("op_3986_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3986_cast_fp16 = slice_by_index(begin = var_3986_begin_0, end = var_3986_end_0, end_mask = var_3986_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3986_cast_fp16")]; + tensor var_3990_begin_0 = const()[name = tensor("op_3990_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_3990_end_0 = const()[name = tensor("op_3990_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_3990_end_mask_0 = const()[name = tensor("op_3990_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3990_cast_fp16 = slice_by_index(begin = var_3990_begin_0, end = var_3990_end_0, end_mask = var_3990_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3990_cast_fp16")]; + tensor var_3994_begin_0 = const()[name = tensor("op_3994_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_3994_end_0 = const()[name = tensor("op_3994_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_3994_end_mask_0 = const()[name = tensor("op_3994_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3994_cast_fp16 = slice_by_index(begin = var_3994_begin_0, end = var_3994_end_0, end_mask = var_3994_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3994_cast_fp16")]; + tensor var_3998_begin_0 = const()[name = tensor("op_3998_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_3998_end_0 = const()[name = tensor("op_3998_end_0"), val = tensor([2, 704, 1, 77])]; + tensor var_3998_end_mask_0 = const()[name = tensor("op_3998_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_3998_cast_fp16 = slice_by_index(begin = var_3998_begin_0, end = var_3998_end_0, end_mask = var_3998_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3998_cast_fp16")]; + tensor var_4002_begin_0 = const()[name = tensor("op_4002_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_4002_end_0 = const()[name = tensor("op_4002_end_0"), val = tensor([2, 768, 1, 77])]; + tensor var_4002_end_mask_0 = const()[name = tensor("op_4002_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4002_cast_fp16 = slice_by_index(begin = var_4002_begin_0, end = var_4002_end_0, end_mask = var_4002_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4002_cast_fp16")]; + tensor var_4006_begin_0 = const()[name = tensor("op_4006_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_4006_end_0 = const()[name = tensor("op_4006_end_0"), val = tensor([2, 832, 1, 77])]; + tensor var_4006_end_mask_0 = const()[name = tensor("op_4006_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4006_cast_fp16 = slice_by_index(begin = var_4006_begin_0, end = var_4006_end_0, end_mask = var_4006_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4006_cast_fp16")]; + tensor var_4010_begin_0 = const()[name = tensor("op_4010_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_4010_end_0 = const()[name = tensor("op_4010_end_0"), val = tensor([2, 896, 1, 77])]; + tensor var_4010_end_mask_0 = const()[name = tensor("op_4010_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4010_cast_fp16 = slice_by_index(begin = var_4010_begin_0, end = var_4010_end_0, end_mask = var_4010_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4010_cast_fp16")]; + tensor var_4014_begin_0 = const()[name = tensor("op_4014_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_4014_end_0 = const()[name = tensor("op_4014_end_0"), val = tensor([2, 960, 1, 77])]; + tensor var_4014_end_mask_0 = const()[name = tensor("op_4014_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4014_cast_fp16 = slice_by_index(begin = var_4014_begin_0, end = var_4014_end_0, end_mask = var_4014_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4014_cast_fp16")]; + tensor var_4018_begin_0 = const()[name = tensor("op_4018_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_4018_end_0 = const()[name = tensor("op_4018_end_0"), val = tensor([2, 1024, 1, 77])]; + tensor var_4018_end_mask_0 = const()[name = tensor("op_4018_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4018_cast_fp16 = slice_by_index(begin = var_4018_begin_0, end = var_4018_end_0, end_mask = var_4018_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4018_cast_fp16")]; + tensor var_4022_begin_0 = const()[name = tensor("op_4022_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_4022_end_0 = const()[name = tensor("op_4022_end_0"), val = tensor([2, 1088, 1, 77])]; + tensor var_4022_end_mask_0 = const()[name = tensor("op_4022_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4022_cast_fp16 = slice_by_index(begin = var_4022_begin_0, end = var_4022_end_0, end_mask = var_4022_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4022_cast_fp16")]; + tensor var_4026_begin_0 = const()[name = tensor("op_4026_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_4026_end_0 = const()[name = tensor("op_4026_end_0"), val = tensor([2, 1152, 1, 77])]; + tensor var_4026_end_mask_0 = const()[name = tensor("op_4026_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4026_cast_fp16 = slice_by_index(begin = var_4026_begin_0, end = var_4026_end_0, end_mask = var_4026_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4026_cast_fp16")]; + tensor var_4030_begin_0 = const()[name = tensor("op_4030_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_4030_end_0 = const()[name = tensor("op_4030_end_0"), val = tensor([2, 1216, 1, 77])]; + tensor var_4030_end_mask_0 = const()[name = tensor("op_4030_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4030_cast_fp16 = slice_by_index(begin = var_4030_begin_0, end = var_4030_end_0, end_mask = var_4030_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4030_cast_fp16")]; + tensor var_4034_begin_0 = const()[name = tensor("op_4034_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_4034_end_0 = const()[name = tensor("op_4034_end_0"), val = tensor([2, 1280, 1, 77])]; + tensor var_4034_end_mask_0 = const()[name = tensor("op_4034_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4034_cast_fp16 = slice_by_index(begin = var_4034_begin_0, end = var_4034_end_0, end_mask = var_4034_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4034_cast_fp16")]; + tensor var_4038_equation_0 = const()[name = tensor("op_4038_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4038_cast_fp16 = einsum(equation = var_4038_equation_0, values = (var_3880_cast_fp16, var_3797_cast_fp16))[name = tensor("op_4038_cast_fp16")]; + tensor var_4039_to_fp16 = const()[name = tensor("op_4039_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_241_cast_fp16 = mul(x = var_4038_cast_fp16, y = var_4039_to_fp16)[name = tensor("aw_241_cast_fp16")]; + tensor var_4042_equation_0 = const()[name = tensor("op_4042_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4042_cast_fp16 = einsum(equation = var_4042_equation_0, values = (var_3884_cast_fp16, var_3801_cast_fp16))[name = tensor("op_4042_cast_fp16")]; + tensor var_4043_to_fp16 = const()[name = tensor("op_4043_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_243_cast_fp16 = mul(x = var_4042_cast_fp16, y = var_4043_to_fp16)[name = tensor("aw_243_cast_fp16")]; + tensor var_4046_equation_0 = const()[name = tensor("op_4046_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4046_cast_fp16 = einsum(equation = var_4046_equation_0, values = (var_3888_cast_fp16, var_3805_cast_fp16))[name = tensor("op_4046_cast_fp16")]; + tensor var_4047_to_fp16 = const()[name = tensor("op_4047_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_245_cast_fp16 = mul(x = var_4046_cast_fp16, y = var_4047_to_fp16)[name = tensor("aw_245_cast_fp16")]; + tensor var_4050_equation_0 = const()[name = tensor("op_4050_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4050_cast_fp16 = einsum(equation = var_4050_equation_0, values = (var_3892_cast_fp16, var_3809_cast_fp16))[name = tensor("op_4050_cast_fp16")]; + tensor var_4051_to_fp16 = const()[name = tensor("op_4051_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_247_cast_fp16 = mul(x = var_4050_cast_fp16, y = var_4051_to_fp16)[name = tensor("aw_247_cast_fp16")]; + tensor var_4054_equation_0 = const()[name = tensor("op_4054_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4054_cast_fp16 = einsum(equation = var_4054_equation_0, values = (var_3896_cast_fp16, var_3813_cast_fp16))[name = tensor("op_4054_cast_fp16")]; + tensor var_4055_to_fp16 = const()[name = tensor("op_4055_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_249_cast_fp16 = mul(x = var_4054_cast_fp16, y = var_4055_to_fp16)[name = tensor("aw_249_cast_fp16")]; + tensor var_4058_equation_0 = const()[name = tensor("op_4058_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4058_cast_fp16 = einsum(equation = var_4058_equation_0, values = (var_3900_cast_fp16, var_3817_cast_fp16))[name = tensor("op_4058_cast_fp16")]; + tensor var_4059_to_fp16 = const()[name = tensor("op_4059_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_251_cast_fp16 = mul(x = var_4058_cast_fp16, y = var_4059_to_fp16)[name = tensor("aw_251_cast_fp16")]; + tensor var_4062_equation_0 = const()[name = tensor("op_4062_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4062_cast_fp16 = einsum(equation = var_4062_equation_0, values = (var_3904_cast_fp16, var_3821_cast_fp16))[name = tensor("op_4062_cast_fp16")]; + tensor var_4063_to_fp16 = const()[name = tensor("op_4063_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_253_cast_fp16 = mul(x = var_4062_cast_fp16, y = var_4063_to_fp16)[name = tensor("aw_253_cast_fp16")]; + tensor var_4066_equation_0 = const()[name = tensor("op_4066_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4066_cast_fp16 = einsum(equation = var_4066_equation_0, values = (var_3908_cast_fp16, var_3825_cast_fp16))[name = tensor("op_4066_cast_fp16")]; + tensor var_4067_to_fp16 = const()[name = tensor("op_4067_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_255_cast_fp16 = mul(x = var_4066_cast_fp16, y = var_4067_to_fp16)[name = tensor("aw_255_cast_fp16")]; + tensor var_4070_equation_0 = const()[name = tensor("op_4070_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4070_cast_fp16 = einsum(equation = var_4070_equation_0, values = (var_3912_cast_fp16, var_3829_cast_fp16))[name = tensor("op_4070_cast_fp16")]; + tensor var_4071_to_fp16 = const()[name = tensor("op_4071_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_257_cast_fp16 = mul(x = var_4070_cast_fp16, y = var_4071_to_fp16)[name = tensor("aw_257_cast_fp16")]; + tensor var_4074_equation_0 = const()[name = tensor("op_4074_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4074_cast_fp16 = einsum(equation = var_4074_equation_0, values = (var_3916_cast_fp16, var_3833_cast_fp16))[name = tensor("op_4074_cast_fp16")]; + tensor var_4075_to_fp16 = const()[name = tensor("op_4075_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_259_cast_fp16 = mul(x = var_4074_cast_fp16, y = var_4075_to_fp16)[name = tensor("aw_259_cast_fp16")]; + tensor var_4078_equation_0 = const()[name = tensor("op_4078_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4078_cast_fp16 = einsum(equation = var_4078_equation_0, values = (var_3920_cast_fp16, var_3837_cast_fp16))[name = tensor("op_4078_cast_fp16")]; + tensor var_4079_to_fp16 = const()[name = tensor("op_4079_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_261_cast_fp16 = mul(x = var_4078_cast_fp16, y = var_4079_to_fp16)[name = tensor("aw_261_cast_fp16")]; + tensor var_4082_equation_0 = const()[name = tensor("op_4082_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4082_cast_fp16 = einsum(equation = var_4082_equation_0, values = (var_3924_cast_fp16, var_3841_cast_fp16))[name = tensor("op_4082_cast_fp16")]; + tensor var_4083_to_fp16 = const()[name = tensor("op_4083_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_263_cast_fp16 = mul(x = var_4082_cast_fp16, y = var_4083_to_fp16)[name = tensor("aw_263_cast_fp16")]; + tensor var_4086_equation_0 = const()[name = tensor("op_4086_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4086_cast_fp16 = einsum(equation = var_4086_equation_0, values = (var_3928_cast_fp16, var_3845_cast_fp16))[name = tensor("op_4086_cast_fp16")]; + tensor var_4087_to_fp16 = const()[name = tensor("op_4087_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_265_cast_fp16 = mul(x = var_4086_cast_fp16, y = var_4087_to_fp16)[name = tensor("aw_265_cast_fp16")]; + tensor var_4090_equation_0 = const()[name = tensor("op_4090_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4090_cast_fp16 = einsum(equation = var_4090_equation_0, values = (var_3932_cast_fp16, var_3849_cast_fp16))[name = tensor("op_4090_cast_fp16")]; + tensor var_4091_to_fp16 = const()[name = tensor("op_4091_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_267_cast_fp16 = mul(x = var_4090_cast_fp16, y = var_4091_to_fp16)[name = tensor("aw_267_cast_fp16")]; + tensor var_4094_equation_0 = const()[name = tensor("op_4094_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4094_cast_fp16 = einsum(equation = var_4094_equation_0, values = (var_3936_cast_fp16, var_3853_cast_fp16))[name = tensor("op_4094_cast_fp16")]; + tensor var_4095_to_fp16 = const()[name = tensor("op_4095_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_269_cast_fp16 = mul(x = var_4094_cast_fp16, y = var_4095_to_fp16)[name = tensor("aw_269_cast_fp16")]; + tensor var_4098_equation_0 = const()[name = tensor("op_4098_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4098_cast_fp16 = einsum(equation = var_4098_equation_0, values = (var_3940_cast_fp16, var_3857_cast_fp16))[name = tensor("op_4098_cast_fp16")]; + tensor var_4099_to_fp16 = const()[name = tensor("op_4099_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_271_cast_fp16 = mul(x = var_4098_cast_fp16, y = var_4099_to_fp16)[name = tensor("aw_271_cast_fp16")]; + tensor var_4102_equation_0 = const()[name = tensor("op_4102_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4102_cast_fp16 = einsum(equation = var_4102_equation_0, values = (var_3944_cast_fp16, var_3861_cast_fp16))[name = tensor("op_4102_cast_fp16")]; + tensor var_4103_to_fp16 = const()[name = tensor("op_4103_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_273_cast_fp16 = mul(x = var_4102_cast_fp16, y = var_4103_to_fp16)[name = tensor("aw_273_cast_fp16")]; + tensor var_4106_equation_0 = const()[name = tensor("op_4106_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4106_cast_fp16 = einsum(equation = var_4106_equation_0, values = (var_3948_cast_fp16, var_3865_cast_fp16))[name = tensor("op_4106_cast_fp16")]; + tensor var_4107_to_fp16 = const()[name = tensor("op_4107_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_275_cast_fp16 = mul(x = var_4106_cast_fp16, y = var_4107_to_fp16)[name = tensor("aw_275_cast_fp16")]; + tensor var_4110_equation_0 = const()[name = tensor("op_4110_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4110_cast_fp16 = einsum(equation = var_4110_equation_0, values = (var_3952_cast_fp16, var_3869_cast_fp16))[name = tensor("op_4110_cast_fp16")]; + tensor var_4111_to_fp16 = const()[name = tensor("op_4111_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_277_cast_fp16 = mul(x = var_4110_cast_fp16, y = var_4111_to_fp16)[name = tensor("aw_277_cast_fp16")]; + tensor var_4114_equation_0 = const()[name = tensor("op_4114_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4114_cast_fp16 = einsum(equation = var_4114_equation_0, values = (var_3956_cast_fp16, var_3873_cast_fp16))[name = tensor("op_4114_cast_fp16")]; + tensor var_4115_to_fp16 = const()[name = tensor("op_4115_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_279_cast_fp16 = mul(x = var_4114_cast_fp16, y = var_4115_to_fp16)[name = tensor("aw_279_cast_fp16")]; + tensor var_4117_cast_fp16 = softmax(axis = var_2254, x = aw_241_cast_fp16)[name = tensor("op_4117_cast_fp16")]; + tensor var_4118_cast_fp16 = softmax(axis = var_2254, x = aw_243_cast_fp16)[name = tensor("op_4118_cast_fp16")]; + tensor var_4119_cast_fp16 = softmax(axis = var_2254, x = aw_245_cast_fp16)[name = tensor("op_4119_cast_fp16")]; + tensor var_4120_cast_fp16 = softmax(axis = var_2254, x = aw_247_cast_fp16)[name = tensor("op_4120_cast_fp16")]; + tensor var_4121_cast_fp16 = softmax(axis = var_2254, x = aw_249_cast_fp16)[name = tensor("op_4121_cast_fp16")]; + tensor var_4122_cast_fp16 = softmax(axis = var_2254, x = aw_251_cast_fp16)[name = tensor("op_4122_cast_fp16")]; + tensor var_4123_cast_fp16 = softmax(axis = var_2254, x = aw_253_cast_fp16)[name = tensor("op_4123_cast_fp16")]; + tensor var_4124_cast_fp16 = softmax(axis = var_2254, x = aw_255_cast_fp16)[name = tensor("op_4124_cast_fp16")]; + tensor var_4125_cast_fp16 = softmax(axis = var_2254, x = aw_257_cast_fp16)[name = tensor("op_4125_cast_fp16")]; + tensor var_4126_cast_fp16 = softmax(axis = var_2254, x = aw_259_cast_fp16)[name = tensor("op_4126_cast_fp16")]; + tensor var_4127_cast_fp16 = softmax(axis = var_2254, x = aw_261_cast_fp16)[name = tensor("op_4127_cast_fp16")]; + tensor var_4128_cast_fp16 = softmax(axis = var_2254, x = aw_263_cast_fp16)[name = tensor("op_4128_cast_fp16")]; + tensor var_4129_cast_fp16 = softmax(axis = var_2254, x = aw_265_cast_fp16)[name = tensor("op_4129_cast_fp16")]; + tensor var_4130_cast_fp16 = softmax(axis = var_2254, x = aw_267_cast_fp16)[name = tensor("op_4130_cast_fp16")]; + tensor var_4131_cast_fp16 = softmax(axis = var_2254, x = aw_269_cast_fp16)[name = tensor("op_4131_cast_fp16")]; + tensor var_4132_cast_fp16 = softmax(axis = var_2254, x = aw_271_cast_fp16)[name = tensor("op_4132_cast_fp16")]; + tensor var_4133_cast_fp16 = softmax(axis = var_2254, x = aw_273_cast_fp16)[name = tensor("op_4133_cast_fp16")]; + tensor var_4134_cast_fp16 = softmax(axis = var_2254, x = aw_275_cast_fp16)[name = tensor("op_4134_cast_fp16")]; + tensor var_4135_cast_fp16 = softmax(axis = var_2254, x = aw_277_cast_fp16)[name = tensor("op_4135_cast_fp16")]; + tensor var_4136_cast_fp16 = softmax(axis = var_2254, x = aw_279_cast_fp16)[name = tensor("op_4136_cast_fp16")]; + tensor var_4138_equation_0 = const()[name = tensor("op_4138_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4138_cast_fp16 = einsum(equation = var_4138_equation_0, values = (var_3958_cast_fp16, var_4117_cast_fp16))[name = tensor("op_4138_cast_fp16")]; + tensor var_4140_equation_0 = const()[name = tensor("op_4140_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4140_cast_fp16 = einsum(equation = var_4140_equation_0, values = (var_3962_cast_fp16, var_4118_cast_fp16))[name = tensor("op_4140_cast_fp16")]; + tensor var_4142_equation_0 = const()[name = tensor("op_4142_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4142_cast_fp16 = einsum(equation = var_4142_equation_0, values = (var_3966_cast_fp16, var_4119_cast_fp16))[name = tensor("op_4142_cast_fp16")]; + tensor var_4144_equation_0 = const()[name = tensor("op_4144_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4144_cast_fp16 = einsum(equation = var_4144_equation_0, values = (var_3970_cast_fp16, var_4120_cast_fp16))[name = tensor("op_4144_cast_fp16")]; + tensor var_4146_equation_0 = const()[name = tensor("op_4146_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4146_cast_fp16 = einsum(equation = var_4146_equation_0, values = (var_3974_cast_fp16, var_4121_cast_fp16))[name = tensor("op_4146_cast_fp16")]; + tensor var_4148_equation_0 = const()[name = tensor("op_4148_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4148_cast_fp16 = einsum(equation = var_4148_equation_0, values = (var_3978_cast_fp16, var_4122_cast_fp16))[name = tensor("op_4148_cast_fp16")]; + tensor var_4150_equation_0 = const()[name = tensor("op_4150_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4150_cast_fp16 = einsum(equation = var_4150_equation_0, values = (var_3982_cast_fp16, var_4123_cast_fp16))[name = tensor("op_4150_cast_fp16")]; + tensor var_4152_equation_0 = const()[name = tensor("op_4152_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4152_cast_fp16 = einsum(equation = var_4152_equation_0, values = (var_3986_cast_fp16, var_4124_cast_fp16))[name = tensor("op_4152_cast_fp16")]; + tensor var_4154_equation_0 = const()[name = tensor("op_4154_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4154_cast_fp16 = einsum(equation = var_4154_equation_0, values = (var_3990_cast_fp16, var_4125_cast_fp16))[name = tensor("op_4154_cast_fp16")]; + tensor var_4156_equation_0 = const()[name = tensor("op_4156_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4156_cast_fp16 = einsum(equation = var_4156_equation_0, values = (var_3994_cast_fp16, var_4126_cast_fp16))[name = tensor("op_4156_cast_fp16")]; + tensor var_4158_equation_0 = const()[name = tensor("op_4158_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4158_cast_fp16 = einsum(equation = var_4158_equation_0, values = (var_3998_cast_fp16, var_4127_cast_fp16))[name = tensor("op_4158_cast_fp16")]; + tensor var_4160_equation_0 = const()[name = tensor("op_4160_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4160_cast_fp16 = einsum(equation = var_4160_equation_0, values = (var_4002_cast_fp16, var_4128_cast_fp16))[name = tensor("op_4160_cast_fp16")]; + tensor var_4162_equation_0 = const()[name = tensor("op_4162_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4162_cast_fp16 = einsum(equation = var_4162_equation_0, values = (var_4006_cast_fp16, var_4129_cast_fp16))[name = tensor("op_4162_cast_fp16")]; + tensor var_4164_equation_0 = const()[name = tensor("op_4164_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4164_cast_fp16 = einsum(equation = var_4164_equation_0, values = (var_4010_cast_fp16, var_4130_cast_fp16))[name = tensor("op_4164_cast_fp16")]; + tensor var_4166_equation_0 = const()[name = tensor("op_4166_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4166_cast_fp16 = einsum(equation = var_4166_equation_0, values = (var_4014_cast_fp16, var_4131_cast_fp16))[name = tensor("op_4166_cast_fp16")]; + tensor var_4168_equation_0 = const()[name = tensor("op_4168_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4168_cast_fp16 = einsum(equation = var_4168_equation_0, values = (var_4018_cast_fp16, var_4132_cast_fp16))[name = tensor("op_4168_cast_fp16")]; + tensor var_4170_equation_0 = const()[name = tensor("op_4170_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4170_cast_fp16 = einsum(equation = var_4170_equation_0, values = (var_4022_cast_fp16, var_4133_cast_fp16))[name = tensor("op_4170_cast_fp16")]; + tensor var_4172_equation_0 = const()[name = tensor("op_4172_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4172_cast_fp16 = einsum(equation = var_4172_equation_0, values = (var_4026_cast_fp16, var_4134_cast_fp16))[name = tensor("op_4172_cast_fp16")]; + tensor var_4174_equation_0 = const()[name = tensor("op_4174_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4174_cast_fp16 = einsum(equation = var_4174_equation_0, values = (var_4030_cast_fp16, var_4135_cast_fp16))[name = tensor("op_4174_cast_fp16")]; + tensor var_4176_equation_0 = const()[name = tensor("op_4176_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4176_cast_fp16 = einsum(equation = var_4176_equation_0, values = (var_4034_cast_fp16, var_4136_cast_fp16))[name = tensor("op_4176_cast_fp16")]; + tensor input_161_interleave_0 = const()[name = tensor("input_161_interleave_0"), val = tensor(false)]; + tensor input_161_cast_fp16 = concat(axis = var_2254, interleave = input_161_interleave_0, values = (var_4138_cast_fp16, var_4140_cast_fp16, var_4142_cast_fp16, var_4144_cast_fp16, var_4146_cast_fp16, var_4148_cast_fp16, var_4150_cast_fp16, var_4152_cast_fp16, var_4154_cast_fp16, var_4156_cast_fp16, var_4158_cast_fp16, var_4160_cast_fp16, var_4162_cast_fp16, var_4164_cast_fp16, var_4166_cast_fp16, var_4168_cast_fp16, var_4170_cast_fp16, var_4172_cast_fp16, var_4174_cast_fp16, var_4176_cast_fp16))[name = tensor("input_161_cast_fp16")]; + tensor var_4182 = const()[name = tensor("op_4182"), val = tensor([1, 1])]; + tensor var_4184 = const()[name = tensor("op_4184"), val = tensor([1, 1])]; + tensor var_4186_pad_type_0 = const()[name = tensor("op_4186_pad_type_0"), val = tensor("custom")]; + tensor var_4186_pad_0 = const()[name = tensor("op_4186_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(308004672)))]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311281536)))]; + tensor var_4186_cast_fp16 = conv(bias = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_4184, groups = var_2254, pad = var_4186_pad_0, pad_type = var_4186_pad_type_0, strides = var_4182, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_161_cast_fp16)[name = tensor("op_4186_cast_fp16")]; + tensor inputs_35_cast_fp16 = add(x = var_4186_cast_fp16, y = inputs_33_cast_fp16)[name = tensor("inputs_35_cast_fp16")]; + tensor var_4190 = const()[name = tensor("op_4190"), val = tensor([1])]; + tensor channels_mean_35_cast_fp16 = reduce_mean(axes = var_4190, keep_dims = var_2249, x = inputs_35_cast_fp16)[name = tensor("channels_mean_35_cast_fp16")]; + tensor zero_mean_35_cast_fp16 = sub(x = inputs_35_cast_fp16, y = channels_mean_35_cast_fp16)[name = tensor("zero_mean_35_cast_fp16")]; + tensor zero_mean_sq_35_cast_fp16 = mul(x = zero_mean_35_cast_fp16, y = zero_mean_35_cast_fp16)[name = tensor("zero_mean_sq_35_cast_fp16")]; + tensor var_4194 = const()[name = tensor("op_4194"), val = tensor([1])]; + tensor var_4195_cast_fp16 = reduce_mean(axes = var_4194, keep_dims = var_2249, x = zero_mean_sq_35_cast_fp16)[name = tensor("op_4195_cast_fp16")]; + tensor var_4196_to_fp16 = const()[name = tensor("op_4196_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_4197_cast_fp16 = add(x = var_4195_cast_fp16, y = var_4196_to_fp16)[name = tensor("op_4197_cast_fp16")]; + tensor denom_35_epsilon_0_to_fp16 = const()[name = tensor("denom_35_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_35_cast_fp16 = rsqrt(epsilon = denom_35_epsilon_0_to_fp16, x = var_4197_cast_fp16)[name = tensor("denom_35_cast_fp16")]; + tensor out_35_cast_fp16 = mul(x = zero_mean_35_cast_fp16, y = denom_35_cast_fp16)[name = tensor("out_35_cast_fp16")]; + tensor var_4201_to_fp16 = const()[name = tensor("op_4201_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311284160)))]; + tensor var_4202_cast_fp16 = add(x = out_35_cast_fp16, y = var_4201_to_fp16)[name = tensor("op_4202_cast_fp16")]; + tensor var_4204_to_fp16 = const()[name = tensor("op_4204_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311286784)))]; + tensor input_163_cast_fp16 = mul(x = var_4202_cast_fp16, y = var_4204_to_fp16)[name = tensor("input_163_cast_fp16")]; + tensor var_4212 = const()[name = tensor("op_4212"), val = tensor([1, 1])]; + tensor var_4214 = const()[name = tensor("op_4214"), val = tensor([1, 1])]; + tensor var_4216_pad_type_0 = const()[name = tensor("op_4216_pad_type_0"), val = tensor("custom")]; + tensor var_4216_pad_0 = const()[name = tensor("op_4216_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311289408)))]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337503872)))]; + tensor var_4216_cast_fp16 = conv(bias = down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_4214, groups = var_2254, pad = var_4216_pad_0, pad_type = var_4216_pad_type_0, strides = var_4212, weight = down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_163_cast_fp16)[name = tensor("op_4216_cast_fp16")]; + tensor var_4217_split_sizes_0 = const()[name = tensor("op_4217_split_sizes_0"), val = tensor([5120, 5120])]; + tensor var_4217_axis_0 = const()[name = tensor("op_4217_axis_0"), val = tensor(1)]; + tensor var_4217_cast_fp16_0, tensor var_4217_cast_fp16_1 = split(axis = var_4217_axis_0, split_sizes = var_4217_split_sizes_0, x = var_4216_cast_fp16)[name = tensor("op_4217_cast_fp16")]; + tensor var_4219_mode_0 = const()[name = tensor("op_4219_mode_0"), val = tensor("EXACT")]; + tensor var_4219_cast_fp16 = gelu(mode = var_4219_mode_0, x = var_4217_cast_fp16_1)[name = tensor("op_4219_cast_fp16")]; + tensor input_165_cast_fp16 = mul(x = var_4217_cast_fp16_0, y = var_4219_cast_fp16)[name = tensor("input_165_cast_fp16")]; + tensor var_4223 = const()[name = tensor("op_4223"), val = tensor([1, 1])]; + tensor var_4225 = const()[name = tensor("op_4225"), val = tensor([1, 1])]; + tensor var_4227_pad_type_0 = const()[name = tensor("op_4227_pad_type_0"), val = tensor("custom")]; + tensor var_4227_pad_0 = const()[name = tensor("op_4227_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337524416)))]; + tensor down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350631680)))]; + tensor var_4227_cast_fp16 = conv(bias = down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_4225, groups = var_2254, pad = var_4227_pad_0, pad_type = var_4227_pad_type_0, strides = var_4223, weight = down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_165_cast_fp16)[name = tensor("op_4227_cast_fp16")]; + tensor hidden_states_105_cast_fp16 = add(x = var_4227_cast_fp16, y = inputs_35_cast_fp16)[name = tensor("hidden_states_105_cast_fp16")]; + tensor var_4229 = const()[name = tensor("op_4229"), val = tensor([2, 1280, 12, 12])]; + tensor input_167_cast_fp16 = reshape(shape = var_4229, x = hidden_states_105_cast_fp16)[name = tensor("input_167_cast_fp16")]; + tensor var_4233 = const()[name = tensor("op_4233"), val = tensor([1, 1])]; + tensor var_4235 = const()[name = tensor("op_4235"), val = tensor([1, 1])]; + tensor hidden_states_107_pad_type_0 = const()[name = tensor("hidden_states_107_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_107_pad_0 = const()[name = tensor("hidden_states_107_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_2_attentions_1_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350634304)))]; + tensor down_blocks_2_attentions_1_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353911168)))]; + tensor hidden_states_107_cast_fp16 = conv(bias = down_blocks_2_attentions_1_proj_out_bias_to_fp16, dilations = var_4235, groups = var_2254, pad = hidden_states_107_pad_0, pad_type = hidden_states_107_pad_type_0, strides = var_4233, weight = down_blocks_2_attentions_1_proj_out_weight_to_fp16, x = input_167_cast_fp16)[name = tensor("hidden_states_107_cast_fp16")]; + tensor input_169_cast_fp16 = add(x = hidden_states_107_cast_fp16, y = hidden_states_95_cast_fp16)[name = tensor("input_169_cast_fp16")]; + tensor var_4242 = const()[name = tensor("op_4242"), val = tensor([2, 2])]; + tensor var_4244 = const()[name = tensor("op_4244"), val = tensor([1, 1])]; + tensor input_171_pad_type_0 = const()[name = tensor("input_171_pad_type_0"), val = tensor("custom")]; + tensor input_171_pad_0 = const()[name = tensor("input_171_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_2_downsamplers_0_conv_weight_to_fp16 = const()[name = tensor("down_blocks_2_downsamplers_0_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353913792)))]; + tensor down_blocks_2_downsamplers_0_conv_bias_to_fp16 = const()[name = tensor("down_blocks_2_downsamplers_0_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383405056)))]; + tensor input_171_cast_fp16 = conv(bias = down_blocks_2_downsamplers_0_conv_bias_to_fp16, dilations = var_4244, groups = var_2254, pad = input_171_pad_0, pad_type = input_171_pad_type_0, strides = var_4242, weight = down_blocks_2_downsamplers_0_conv_weight_to_fp16, x = input_169_cast_fp16)[name = tensor("input_171_cast_fp16")]; + tensor var_4256 = const()[name = tensor("op_4256"), val = tensor(1)]; + tensor reshape_72_shape_0 = const()[name = tensor("reshape_72_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_72_cast_fp16 = reshape(shape = reshape_72_shape_0, x = input_171_cast_fp16)[name = tensor("reshape_72_cast_fp16")]; + tensor reduce_mean_54_axes_0 = const()[name = tensor("reduce_mean_54_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_54_keep_dims_0 = const()[name = tensor("reduce_mean_54_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_54_cast_fp16 = reduce_mean(axes = reduce_mean_54_axes_0, keep_dims = reduce_mean_54_keep_dims_0, x = reshape_72_cast_fp16)[name = tensor("reduce_mean_54_cast_fp16")]; + tensor sub_36_cast_fp16 = sub(x = reshape_72_cast_fp16, y = reduce_mean_54_cast_fp16)[name = tensor("sub_36_cast_fp16")]; + tensor square_18_cast_fp16 = square(x = sub_36_cast_fp16)[name = tensor("square_18_cast_fp16")]; + tensor reduce_mean_56_axes_0 = const()[name = tensor("reduce_mean_56_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_56_keep_dims_0 = const()[name = tensor("reduce_mean_56_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_56_cast_fp16 = reduce_mean(axes = reduce_mean_56_axes_0, keep_dims = reduce_mean_56_keep_dims_0, x = square_18_cast_fp16)[name = tensor("reduce_mean_56_cast_fp16")]; + tensor add_36_y_0_to_fp16 = const()[name = tensor("add_36_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_36_cast_fp16 = add(x = reduce_mean_56_cast_fp16, y = add_36_y_0_to_fp16)[name = tensor("add_36_cast_fp16")]; + tensor sqrt_18_cast_fp16 = sqrt(x = add_36_cast_fp16)[name = tensor("sqrt_18_cast_fp16")]; + tensor real_div_18_cast_fp16 = real_div(x = sub_36_cast_fp16, y = sqrt_18_cast_fp16)[name = tensor("real_div_18_cast_fp16")]; + tensor reshape_73_shape_0 = const()[name = tensor("reshape_73_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_73_cast_fp16 = reshape(shape = reshape_73_shape_0, x = real_div_18_cast_fp16)[name = tensor("reshape_73_cast_fp16")]; + tensor add_37_gamma_0_to_fp16 = const()[name = tensor("add_37_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383407680)))]; + tensor add_37_beta_0_to_fp16 = const()[name = tensor("add_37_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383410304)))]; + tensor add_37_epsilon_0_to_fp16 = const()[name = tensor("add_37_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_37_cast_fp16 = batch_norm(beta = add_37_beta_0_to_fp16, epsilon = add_37_epsilon_0_to_fp16, gamma = add_37_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_73_cast_fp16)[name = tensor("add_37_cast_fp16")]; + tensor input_175_cast_fp16 = silu(x = add_37_cast_fp16)[name = tensor("input_175_cast_fp16")]; + tensor var_4272 = const()[name = tensor("op_4272"), val = tensor([1, 1])]; + tensor var_4274 = const()[name = tensor("op_4274"), val = tensor([1, 1])]; + tensor hidden_states_109_pad_type_0 = const()[name = tensor("hidden_states_109_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_109_pad_0 = const()[name = tensor("hidden_states_109_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_3_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383412928)))]; + tensor down_blocks_3_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412904192)))]; + tensor hidden_states_109_cast_fp16 = conv(bias = down_blocks_3_resnets_0_conv1_bias_to_fp16, dilations = var_4274, groups = var_4256, pad = hidden_states_109_pad_0, pad_type = hidden_states_109_pad_type_0, strides = var_4272, weight = down_blocks_3_resnets_0_conv1_weight_to_fp16, x = input_175_cast_fp16)[name = tensor("hidden_states_109_cast_fp16")]; + tensor var_4280 = const()[name = tensor("op_4280"), val = tensor([1, 1])]; + tensor var_4282 = const()[name = tensor("op_4282"), val = tensor([1, 1])]; + tensor temb_13_pad_type_0 = const()[name = tensor("temb_13_pad_type_0"), val = tensor("custom")]; + tensor temb_13_pad_0 = const()[name = tensor("temb_13_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_3_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412906816)))]; + tensor down_blocks_3_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416183680)))]; + tensor temb_13_cast_fp16 = conv(bias = down_blocks_3_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_4282, groups = var_4256, pad = temb_13_pad_0, pad_type = temb_13_pad_type_0, strides = var_4280, weight = down_blocks_3_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_13_cast_fp16")]; + tensor input_179_cast_fp16 = add(x = hidden_states_109_cast_fp16, y = temb_13_cast_fp16)[name = tensor("input_179_cast_fp16")]; + tensor reshape_76_shape_0 = const()[name = tensor("reshape_76_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_76_cast_fp16 = reshape(shape = reshape_76_shape_0, x = input_179_cast_fp16)[name = tensor("reshape_76_cast_fp16")]; + tensor reduce_mean_57_axes_0 = const()[name = tensor("reduce_mean_57_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_57_keep_dims_0 = const()[name = tensor("reduce_mean_57_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_57_cast_fp16 = reduce_mean(axes = reduce_mean_57_axes_0, keep_dims = reduce_mean_57_keep_dims_0, x = reshape_76_cast_fp16)[name = tensor("reduce_mean_57_cast_fp16")]; + tensor sub_38_cast_fp16 = sub(x = reshape_76_cast_fp16, y = reduce_mean_57_cast_fp16)[name = tensor("sub_38_cast_fp16")]; + tensor square_19_cast_fp16 = square(x = sub_38_cast_fp16)[name = tensor("square_19_cast_fp16")]; + tensor reduce_mean_59_axes_0 = const()[name = tensor("reduce_mean_59_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_59_keep_dims_0 = const()[name = tensor("reduce_mean_59_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_59_cast_fp16 = reduce_mean(axes = reduce_mean_59_axes_0, keep_dims = reduce_mean_59_keep_dims_0, x = square_19_cast_fp16)[name = tensor("reduce_mean_59_cast_fp16")]; + tensor add_38_y_0_to_fp16 = const()[name = tensor("add_38_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_38_cast_fp16 = add(x = reduce_mean_59_cast_fp16, y = add_38_y_0_to_fp16)[name = tensor("add_38_cast_fp16")]; + tensor sqrt_19_cast_fp16 = sqrt(x = add_38_cast_fp16)[name = tensor("sqrt_19_cast_fp16")]; + tensor real_div_19_cast_fp16 = real_div(x = sub_38_cast_fp16, y = sqrt_19_cast_fp16)[name = tensor("real_div_19_cast_fp16")]; + tensor reshape_77_shape_0 = const()[name = tensor("reshape_77_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_77_cast_fp16 = reshape(shape = reshape_77_shape_0, x = real_div_19_cast_fp16)[name = tensor("reshape_77_cast_fp16")]; + tensor add_39_gamma_0_to_fp16 = const()[name = tensor("add_39_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416186304)))]; + tensor add_39_beta_0_to_fp16 = const()[name = tensor("add_39_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416188928)))]; + tensor add_39_epsilon_0_to_fp16 = const()[name = tensor("add_39_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_39_cast_fp16 = batch_norm(beta = add_39_beta_0_to_fp16, epsilon = add_39_epsilon_0_to_fp16, gamma = add_39_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_77_cast_fp16)[name = tensor("add_39_cast_fp16")]; + tensor input_183_cast_fp16 = silu(x = add_39_cast_fp16)[name = tensor("input_183_cast_fp16")]; + tensor var_4292 = const()[name = tensor("op_4292"), val = tensor([1, 1])]; + tensor var_4294 = const()[name = tensor("op_4294"), val = tensor([1, 1])]; + tensor hidden_states_111_pad_type_0 = const()[name = tensor("hidden_states_111_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_111_pad_0 = const()[name = tensor("hidden_states_111_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_3_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416191552)))]; + tensor down_blocks_3_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445682816)))]; + tensor hidden_states_111_cast_fp16 = conv(bias = down_blocks_3_resnets_0_conv2_bias_to_fp16, dilations = var_4294, groups = var_4256, pad = hidden_states_111_pad_0, pad_type = hidden_states_111_pad_type_0, strides = var_4292, weight = down_blocks_3_resnets_0_conv2_weight_to_fp16, x = input_183_cast_fp16)[name = tensor("hidden_states_111_cast_fp16")]; + tensor input_185_cast_fp16 = add(x = input_171_cast_fp16, y = hidden_states_111_cast_fp16)[name = tensor("input_185_cast_fp16")]; + tensor reshape_80_shape_0 = const()[name = tensor("reshape_80_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_80_cast_fp16 = reshape(shape = reshape_80_shape_0, x = input_185_cast_fp16)[name = tensor("reshape_80_cast_fp16")]; + tensor reduce_mean_60_axes_0 = const()[name = tensor("reduce_mean_60_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_60_keep_dims_0 = const()[name = tensor("reduce_mean_60_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_60_cast_fp16 = reduce_mean(axes = reduce_mean_60_axes_0, keep_dims = reduce_mean_60_keep_dims_0, x = reshape_80_cast_fp16)[name = tensor("reduce_mean_60_cast_fp16")]; + tensor sub_40_cast_fp16 = sub(x = reshape_80_cast_fp16, y = reduce_mean_60_cast_fp16)[name = tensor("sub_40_cast_fp16")]; + tensor square_20_cast_fp16 = square(x = sub_40_cast_fp16)[name = tensor("square_20_cast_fp16")]; + tensor reduce_mean_62_axes_0 = const()[name = tensor("reduce_mean_62_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_62_keep_dims_0 = const()[name = tensor("reduce_mean_62_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_62_cast_fp16 = reduce_mean(axes = reduce_mean_62_axes_0, keep_dims = reduce_mean_62_keep_dims_0, x = square_20_cast_fp16)[name = tensor("reduce_mean_62_cast_fp16")]; + tensor add_40_y_0_to_fp16 = const()[name = tensor("add_40_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_40_cast_fp16 = add(x = reduce_mean_62_cast_fp16, y = add_40_y_0_to_fp16)[name = tensor("add_40_cast_fp16")]; + tensor sqrt_20_cast_fp16 = sqrt(x = add_40_cast_fp16)[name = tensor("sqrt_20_cast_fp16")]; + tensor real_div_20_cast_fp16 = real_div(x = sub_40_cast_fp16, y = sqrt_20_cast_fp16)[name = tensor("real_div_20_cast_fp16")]; + tensor reshape_81_shape_0 = const()[name = tensor("reshape_81_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_81_cast_fp16 = reshape(shape = reshape_81_shape_0, x = real_div_20_cast_fp16)[name = tensor("reshape_81_cast_fp16")]; + tensor add_41_gamma_0_to_fp16 = const()[name = tensor("add_41_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445685440)))]; + tensor add_41_beta_0_to_fp16 = const()[name = tensor("add_41_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445688064)))]; + tensor add_41_epsilon_0_to_fp16 = const()[name = tensor("add_41_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_41_cast_fp16 = batch_norm(beta = add_41_beta_0_to_fp16, epsilon = add_41_epsilon_0_to_fp16, gamma = add_41_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_81_cast_fp16)[name = tensor("add_41_cast_fp16")]; + tensor input_189_cast_fp16 = silu(x = add_41_cast_fp16)[name = tensor("input_189_cast_fp16")]; + tensor var_4309 = const()[name = tensor("op_4309"), val = tensor([1, 1])]; + tensor var_4311 = const()[name = tensor("op_4311"), val = tensor([1, 1])]; + tensor hidden_states_113_pad_type_0 = const()[name = tensor("hidden_states_113_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_113_pad_0 = const()[name = tensor("hidden_states_113_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_3_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445690688)))]; + tensor down_blocks_3_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(475181952)))]; + tensor hidden_states_113_cast_fp16 = conv(bias = down_blocks_3_resnets_1_conv1_bias_to_fp16, dilations = var_4311, groups = var_4256, pad = hidden_states_113_pad_0, pad_type = hidden_states_113_pad_type_0, strides = var_4309, weight = down_blocks_3_resnets_1_conv1_weight_to_fp16, x = input_189_cast_fp16)[name = tensor("hidden_states_113_cast_fp16")]; + tensor var_4317 = const()[name = tensor("op_4317"), val = tensor([1, 1])]; + tensor var_4319 = const()[name = tensor("op_4319"), val = tensor([1, 1])]; + tensor temb_15_pad_type_0 = const()[name = tensor("temb_15_pad_type_0"), val = tensor("custom")]; + tensor temb_15_pad_0 = const()[name = tensor("temb_15_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor down_blocks_3_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(475184576)))]; + tensor down_blocks_3_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478461440)))]; + tensor temb_15_cast_fp16 = conv(bias = down_blocks_3_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_4319, groups = var_4256, pad = temb_15_pad_0, pad_type = temb_15_pad_type_0, strides = var_4317, weight = down_blocks_3_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_15_cast_fp16")]; + tensor input_193_cast_fp16 = add(x = hidden_states_113_cast_fp16, y = temb_15_cast_fp16)[name = tensor("input_193_cast_fp16")]; + tensor reshape_84_shape_0 = const()[name = tensor("reshape_84_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_84_cast_fp16 = reshape(shape = reshape_84_shape_0, x = input_193_cast_fp16)[name = tensor("reshape_84_cast_fp16")]; + tensor reduce_mean_63_axes_0 = const()[name = tensor("reduce_mean_63_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_63_keep_dims_0 = const()[name = tensor("reduce_mean_63_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_63_cast_fp16 = reduce_mean(axes = reduce_mean_63_axes_0, keep_dims = reduce_mean_63_keep_dims_0, x = reshape_84_cast_fp16)[name = tensor("reduce_mean_63_cast_fp16")]; + tensor sub_42_cast_fp16 = sub(x = reshape_84_cast_fp16, y = reduce_mean_63_cast_fp16)[name = tensor("sub_42_cast_fp16")]; + tensor square_21_cast_fp16 = square(x = sub_42_cast_fp16)[name = tensor("square_21_cast_fp16")]; + tensor reduce_mean_65_axes_0 = const()[name = tensor("reduce_mean_65_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_65_keep_dims_0 = const()[name = tensor("reduce_mean_65_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_65_cast_fp16 = reduce_mean(axes = reduce_mean_65_axes_0, keep_dims = reduce_mean_65_keep_dims_0, x = square_21_cast_fp16)[name = tensor("reduce_mean_65_cast_fp16")]; + tensor add_42_y_0_to_fp16 = const()[name = tensor("add_42_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_42_cast_fp16 = add(x = reduce_mean_65_cast_fp16, y = add_42_y_0_to_fp16)[name = tensor("add_42_cast_fp16")]; + tensor sqrt_21_cast_fp16 = sqrt(x = add_42_cast_fp16)[name = tensor("sqrt_21_cast_fp16")]; + tensor real_div_21_cast_fp16 = real_div(x = sub_42_cast_fp16, y = sqrt_21_cast_fp16)[name = tensor("real_div_21_cast_fp16")]; + tensor reshape_85_shape_0 = const()[name = tensor("reshape_85_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_85_cast_fp16 = reshape(shape = reshape_85_shape_0, x = real_div_21_cast_fp16)[name = tensor("reshape_85_cast_fp16")]; + tensor add_43_gamma_0_to_fp16 = const()[name = tensor("add_43_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478464064)))]; + tensor add_43_beta_0_to_fp16 = const()[name = tensor("add_43_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478466688)))]; + tensor add_43_epsilon_0_to_fp16 = const()[name = tensor("add_43_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_43_cast_fp16 = batch_norm(beta = add_43_beta_0_to_fp16, epsilon = add_43_epsilon_0_to_fp16, gamma = add_43_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_85_cast_fp16)[name = tensor("add_43_cast_fp16")]; + tensor input_197_cast_fp16 = silu(x = add_43_cast_fp16)[name = tensor("input_197_cast_fp16")]; + tensor var_4329 = const()[name = tensor("op_4329"), val = tensor([1, 1])]; + tensor var_4331 = const()[name = tensor("op_4331"), val = tensor([1, 1])]; + tensor hidden_states_115_pad_type_0 = const()[name = tensor("hidden_states_115_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_115_pad_0 = const()[name = tensor("hidden_states_115_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor down_blocks_3_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478469312)))]; + tensor down_blocks_3_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507960576)))]; + tensor hidden_states_115_cast_fp16 = conv(bias = down_blocks_3_resnets_1_conv2_bias_to_fp16, dilations = var_4331, groups = var_4256, pad = hidden_states_115_pad_0, pad_type = hidden_states_115_pad_type_0, strides = var_4329, weight = down_blocks_3_resnets_1_conv2_weight_to_fp16, x = input_197_cast_fp16)[name = tensor("hidden_states_115_cast_fp16")]; + tensor input_199_cast_fp16 = add(x = input_185_cast_fp16, y = hidden_states_115_cast_fp16)[name = tensor("input_199_cast_fp16")]; + tensor var_4366 = const()[name = tensor("op_4366"), val = tensor(true)]; + tensor var_4371 = const()[name = tensor("op_4371"), val = tensor(1)]; + tensor reshape_88_shape_0 = const()[name = tensor("reshape_88_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_88_cast_fp16 = reshape(shape = reshape_88_shape_0, x = input_199_cast_fp16)[name = tensor("reshape_88_cast_fp16")]; + tensor reduce_mean_66_axes_0 = const()[name = tensor("reduce_mean_66_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_66_keep_dims_0 = const()[name = tensor("reduce_mean_66_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_66_cast_fp16 = reduce_mean(axes = reduce_mean_66_axes_0, keep_dims = reduce_mean_66_keep_dims_0, x = reshape_88_cast_fp16)[name = tensor("reduce_mean_66_cast_fp16")]; + tensor sub_44_cast_fp16 = sub(x = reshape_88_cast_fp16, y = reduce_mean_66_cast_fp16)[name = tensor("sub_44_cast_fp16")]; + tensor square_22_cast_fp16 = square(x = sub_44_cast_fp16)[name = tensor("square_22_cast_fp16")]; + tensor reduce_mean_68_axes_0 = const()[name = tensor("reduce_mean_68_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_68_keep_dims_0 = const()[name = tensor("reduce_mean_68_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_68_cast_fp16 = reduce_mean(axes = reduce_mean_68_axes_0, keep_dims = reduce_mean_68_keep_dims_0, x = square_22_cast_fp16)[name = tensor("reduce_mean_68_cast_fp16")]; + tensor add_44_y_0_to_fp16 = const()[name = tensor("add_44_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_44_cast_fp16 = add(x = reduce_mean_68_cast_fp16, y = add_44_y_0_to_fp16)[name = tensor("add_44_cast_fp16")]; + tensor sqrt_22_cast_fp16 = sqrt(x = add_44_cast_fp16)[name = tensor("sqrt_22_cast_fp16")]; + tensor real_div_22_cast_fp16 = real_div(x = sub_44_cast_fp16, y = sqrt_22_cast_fp16)[name = tensor("real_div_22_cast_fp16")]; + tensor reshape_89_shape_0 = const()[name = tensor("reshape_89_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_89_cast_fp16 = reshape(shape = reshape_89_shape_0, x = real_div_22_cast_fp16)[name = tensor("reshape_89_cast_fp16")]; + tensor add_45_gamma_0_to_fp16 = const()[name = tensor("add_45_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507963200)))]; + tensor add_45_beta_0_to_fp16 = const()[name = tensor("add_45_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507965824)))]; + tensor add_45_epsilon_0_to_fp16 = const()[name = tensor("add_45_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_45_cast_fp16 = batch_norm(beta = add_45_beta_0_to_fp16, epsilon = add_45_epsilon_0_to_fp16, gamma = add_45_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_89_cast_fp16)[name = tensor("add_45_cast_fp16")]; + tensor input_203_cast_fp16 = silu(x = add_45_cast_fp16)[name = tensor("input_203_cast_fp16")]; + tensor var_4389 = const()[name = tensor("op_4389"), val = tensor([1, 1])]; + tensor var_4391 = const()[name = tensor("op_4391"), val = tensor([1, 1])]; + tensor hidden_states_117_pad_type_0 = const()[name = tensor("hidden_states_117_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_117_pad_0 = const()[name = tensor("hidden_states_117_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor mid_block_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("mid_block_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507968448)))]; + tensor mid_block_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("mid_block_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537459712)))]; + tensor hidden_states_117_cast_fp16 = conv(bias = mid_block_resnets_0_conv1_bias_to_fp16, dilations = var_4391, groups = var_4371, pad = hidden_states_117_pad_0, pad_type = hidden_states_117_pad_type_0, strides = var_4389, weight = mid_block_resnets_0_conv1_weight_to_fp16, x = input_203_cast_fp16)[name = tensor("hidden_states_117_cast_fp16")]; + tensor var_4397 = const()[name = tensor("op_4397"), val = tensor([1, 1])]; + tensor var_4399 = const()[name = tensor("op_4399"), val = tensor([1, 1])]; + tensor temb_17_pad_type_0 = const()[name = tensor("temb_17_pad_type_0"), val = tensor("custom")]; + tensor temb_17_pad_0 = const()[name = tensor("temb_17_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("mid_block_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537462336)))]; + tensor mid_block_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("mid_block_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540739200)))]; + tensor temb_17_cast_fp16 = conv(bias = mid_block_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_4399, groups = var_4371, pad = temb_17_pad_0, pad_type = temb_17_pad_type_0, strides = var_4397, weight = mid_block_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_17_cast_fp16")]; + tensor input_207_cast_fp16 = add(x = hidden_states_117_cast_fp16, y = temb_17_cast_fp16)[name = tensor("input_207_cast_fp16")]; + tensor reshape_92_shape_0 = const()[name = tensor("reshape_92_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_92_cast_fp16 = reshape(shape = reshape_92_shape_0, x = input_207_cast_fp16)[name = tensor("reshape_92_cast_fp16")]; + tensor reduce_mean_69_axes_0 = const()[name = tensor("reduce_mean_69_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_69_keep_dims_0 = const()[name = tensor("reduce_mean_69_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_69_cast_fp16 = reduce_mean(axes = reduce_mean_69_axes_0, keep_dims = reduce_mean_69_keep_dims_0, x = reshape_92_cast_fp16)[name = tensor("reduce_mean_69_cast_fp16")]; + tensor sub_46_cast_fp16 = sub(x = reshape_92_cast_fp16, y = reduce_mean_69_cast_fp16)[name = tensor("sub_46_cast_fp16")]; + tensor square_23_cast_fp16 = square(x = sub_46_cast_fp16)[name = tensor("square_23_cast_fp16")]; + tensor reduce_mean_71_axes_0 = const()[name = tensor("reduce_mean_71_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_71_keep_dims_0 = const()[name = tensor("reduce_mean_71_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_71_cast_fp16 = reduce_mean(axes = reduce_mean_71_axes_0, keep_dims = reduce_mean_71_keep_dims_0, x = square_23_cast_fp16)[name = tensor("reduce_mean_71_cast_fp16")]; + tensor add_46_y_0_to_fp16 = const()[name = tensor("add_46_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_46_cast_fp16 = add(x = reduce_mean_71_cast_fp16, y = add_46_y_0_to_fp16)[name = tensor("add_46_cast_fp16")]; + tensor sqrt_23_cast_fp16 = sqrt(x = add_46_cast_fp16)[name = tensor("sqrt_23_cast_fp16")]; + tensor real_div_23_cast_fp16 = real_div(x = sub_46_cast_fp16, y = sqrt_23_cast_fp16)[name = tensor("real_div_23_cast_fp16")]; + tensor reshape_93_shape_0 = const()[name = tensor("reshape_93_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_93_cast_fp16 = reshape(shape = reshape_93_shape_0, x = real_div_23_cast_fp16)[name = tensor("reshape_93_cast_fp16")]; + tensor add_47_gamma_0_to_fp16 = const()[name = tensor("add_47_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540741824)))]; + tensor add_47_beta_0_to_fp16 = const()[name = tensor("add_47_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540744448)))]; + tensor add_47_epsilon_0_to_fp16 = const()[name = tensor("add_47_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_47_cast_fp16 = batch_norm(beta = add_47_beta_0_to_fp16, epsilon = add_47_epsilon_0_to_fp16, gamma = add_47_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_93_cast_fp16)[name = tensor("add_47_cast_fp16")]; + tensor input_211_cast_fp16 = silu(x = add_47_cast_fp16)[name = tensor("input_211_cast_fp16")]; + tensor var_4409 = const()[name = tensor("op_4409"), val = tensor([1, 1])]; + tensor var_4411 = const()[name = tensor("op_4411"), val = tensor([1, 1])]; + tensor hidden_states_119_pad_type_0 = const()[name = tensor("hidden_states_119_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_119_pad_0 = const()[name = tensor("hidden_states_119_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor mid_block_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("mid_block_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540747072)))]; + tensor mid_block_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("mid_block_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570238336)))]; + tensor hidden_states_119_cast_fp16 = conv(bias = mid_block_resnets_0_conv2_bias_to_fp16, dilations = var_4411, groups = var_4371, pad = hidden_states_119_pad_0, pad_type = hidden_states_119_pad_type_0, strides = var_4409, weight = mid_block_resnets_0_conv2_weight_to_fp16, x = input_211_cast_fp16)[name = tensor("hidden_states_119_cast_fp16")]; + tensor hidden_states_121_cast_fp16 = add(x = input_199_cast_fp16, y = hidden_states_119_cast_fp16)[name = tensor("hidden_states_121_cast_fp16")]; + tensor reshape_96_shape_0 = const()[name = tensor("reshape_96_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_96_cast_fp16 = reshape(shape = reshape_96_shape_0, x = hidden_states_121_cast_fp16)[name = tensor("reshape_96_cast_fp16")]; + tensor reduce_mean_72_axes_0 = const()[name = tensor("reduce_mean_72_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_72_keep_dims_0 = const()[name = tensor("reduce_mean_72_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_72_cast_fp16 = reduce_mean(axes = reduce_mean_72_axes_0, keep_dims = reduce_mean_72_keep_dims_0, x = reshape_96_cast_fp16)[name = tensor("reduce_mean_72_cast_fp16")]; + tensor sub_48_cast_fp16 = sub(x = reshape_96_cast_fp16, y = reduce_mean_72_cast_fp16)[name = tensor("sub_48_cast_fp16")]; + tensor square_24_cast_fp16 = square(x = sub_48_cast_fp16)[name = tensor("square_24_cast_fp16")]; + tensor reduce_mean_74_axes_0 = const()[name = tensor("reduce_mean_74_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_74_keep_dims_0 = const()[name = tensor("reduce_mean_74_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_74_cast_fp16 = reduce_mean(axes = reduce_mean_74_axes_0, keep_dims = reduce_mean_74_keep_dims_0, x = square_24_cast_fp16)[name = tensor("reduce_mean_74_cast_fp16")]; + tensor add_48_y_0_to_fp16 = const()[name = tensor("add_48_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_48_cast_fp16 = add(x = reduce_mean_74_cast_fp16, y = add_48_y_0_to_fp16)[name = tensor("add_48_cast_fp16")]; + tensor sqrt_24_cast_fp16 = sqrt(x = add_48_cast_fp16)[name = tensor("sqrt_24_cast_fp16")]; + tensor real_div_24_cast_fp16 = real_div(x = sub_48_cast_fp16, y = sqrt_24_cast_fp16)[name = tensor("real_div_24_cast_fp16")]; + tensor reshape_97_shape_0 = const()[name = tensor("reshape_97_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_97_cast_fp16 = reshape(shape = reshape_97_shape_0, x = real_div_24_cast_fp16)[name = tensor("reshape_97_cast_fp16")]; + tensor add_49_gamma_0_to_fp16 = const()[name = tensor("add_49_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570240960)))]; + tensor add_49_beta_0_to_fp16 = const()[name = tensor("add_49_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570243584)))]; + tensor add_49_epsilon_0_to_fp16 = const()[name = tensor("add_49_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_49_cast_fp16 = batch_norm(beta = add_49_beta_0_to_fp16, epsilon = add_49_epsilon_0_to_fp16, gamma = add_49_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_97_cast_fp16)[name = tensor("add_49_cast_fp16")]; + tensor var_4431 = const()[name = tensor("op_4431"), val = tensor([1, 1])]; + tensor var_4433 = const()[name = tensor("op_4433"), val = tensor([1, 1])]; + tensor hidden_states_123_pad_type_0 = const()[name = tensor("hidden_states_123_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_123_pad_0 = const()[name = tensor("hidden_states_123_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570246208)))]; + tensor mid_block_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(573523072)))]; + tensor hidden_states_123_cast_fp16 = conv(bias = mid_block_attentions_0_proj_in_bias_to_fp16, dilations = var_4433, groups = var_4371, pad = hidden_states_123_pad_0, pad_type = hidden_states_123_pad_type_0, strides = var_4431, weight = mid_block_attentions_0_proj_in_weight_to_fp16, x = add_49_cast_fp16)[name = tensor("hidden_states_123_cast_fp16")]; + tensor var_4438 = const()[name = tensor("op_4438"), val = tensor([2, 1280, 1, 36])]; + tensor inputs_37_cast_fp16 = reshape(shape = var_4438, x = hidden_states_123_cast_fp16)[name = tensor("inputs_37_cast_fp16")]; + tensor var_4448 = const()[name = tensor("op_4448"), val = tensor([1])]; + tensor channels_mean_37_cast_fp16 = reduce_mean(axes = var_4448, keep_dims = var_4366, x = inputs_37_cast_fp16)[name = tensor("channels_mean_37_cast_fp16")]; + tensor zero_mean_37_cast_fp16 = sub(x = inputs_37_cast_fp16, y = channels_mean_37_cast_fp16)[name = tensor("zero_mean_37_cast_fp16")]; + tensor zero_mean_sq_37_cast_fp16 = mul(x = zero_mean_37_cast_fp16, y = zero_mean_37_cast_fp16)[name = tensor("zero_mean_sq_37_cast_fp16")]; + tensor var_4452 = const()[name = tensor("op_4452"), val = tensor([1])]; + tensor var_4453_cast_fp16 = reduce_mean(axes = var_4452, keep_dims = var_4366, x = zero_mean_sq_37_cast_fp16)[name = tensor("op_4453_cast_fp16")]; + tensor var_4454_to_fp16 = const()[name = tensor("op_4454_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_4455_cast_fp16 = add(x = var_4453_cast_fp16, y = var_4454_to_fp16)[name = tensor("op_4455_cast_fp16")]; + tensor denom_37_epsilon_0_to_fp16 = const()[name = tensor("denom_37_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_37_cast_fp16 = rsqrt(epsilon = denom_37_epsilon_0_to_fp16, x = var_4455_cast_fp16)[name = tensor("denom_37_cast_fp16")]; + tensor out_37_cast_fp16 = mul(x = zero_mean_37_cast_fp16, y = denom_37_cast_fp16)[name = tensor("out_37_cast_fp16")]; + tensor var_4459_to_fp16 = const()[name = tensor("op_4459_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(573525696)))]; + tensor var_4460_cast_fp16 = add(x = out_37_cast_fp16, y = var_4459_to_fp16)[name = tensor("op_4460_cast_fp16")]; + tensor var_4462_to_fp16 = const()[name = tensor("op_4462_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(573528320)))]; + tensor hidden_states_125_cast_fp16 = mul(x = var_4460_cast_fp16, y = var_4462_to_fp16)[name = tensor("hidden_states_125_cast_fp16")]; + tensor var_4469 = const()[name = tensor("op_4469"), val = tensor([1, 1])]; + tensor var_4471 = const()[name = tensor("op_4471"), val = tensor([1, 1])]; + tensor q_25_pad_type_0 = const()[name = tensor("q_25_pad_type_0"), val = tensor("custom")]; + tensor q_25_pad_0 = const()[name = tensor("q_25_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(573530944)))]; + tensor q_25_cast_fp16 = conv(dilations = var_4471, groups = var_4371, pad = q_25_pad_0, pad_type = q_25_pad_type_0, strides = var_4469, weight = mid_block_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_125_cast_fp16)[name = tensor("q_25_cast_fp16")]; + tensor var_4475 = const()[name = tensor("op_4475"), val = tensor([1, 1])]; + tensor var_4477 = const()[name = tensor("op_4477"), val = tensor([1, 1])]; + tensor k_49_pad_type_0 = const()[name = tensor("k_49_pad_type_0"), val = tensor("custom")]; + tensor k_49_pad_0 = const()[name = tensor("k_49_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(576807808)))]; + tensor k_49_cast_fp16 = conv(dilations = var_4477, groups = var_4371, pad = k_49_pad_0, pad_type = k_49_pad_type_0, strides = var_4475, weight = mid_block_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_125_cast_fp16)[name = tensor("k_49_cast_fp16")]; + tensor var_4481 = const()[name = tensor("op_4481"), val = tensor([1, 1])]; + tensor var_4483 = const()[name = tensor("op_4483"), val = tensor([1, 1])]; + tensor v_25_pad_type_0 = const()[name = tensor("v_25_pad_type_0"), val = tensor("custom")]; + tensor v_25_pad_0 = const()[name = tensor("v_25_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(580084672)))]; + tensor v_25_cast_fp16 = conv(dilations = var_4483, groups = var_4371, pad = v_25_pad_0, pad_type = v_25_pad_type_0, strides = var_4481, weight = mid_block_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_125_cast_fp16)[name = tensor("v_25_cast_fp16")]; + tensor var_4487_begin_0 = const()[name = tensor("op_4487_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_4487_end_0 = const()[name = tensor("op_4487_end_0"), val = tensor([2, 64, 1, 36])]; + tensor var_4487_end_mask_0 = const()[name = tensor("op_4487_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4487_cast_fp16 = slice_by_index(begin = var_4487_begin_0, end = var_4487_end_0, end_mask = var_4487_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4487_cast_fp16")]; + tensor var_4491_begin_0 = const()[name = tensor("op_4491_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_4491_end_0 = const()[name = tensor("op_4491_end_0"), val = tensor([2, 128, 1, 36])]; + tensor var_4491_end_mask_0 = const()[name = tensor("op_4491_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4491_cast_fp16 = slice_by_index(begin = var_4491_begin_0, end = var_4491_end_0, end_mask = var_4491_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4491_cast_fp16")]; + tensor var_4495_begin_0 = const()[name = tensor("op_4495_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_4495_end_0 = const()[name = tensor("op_4495_end_0"), val = tensor([2, 192, 1, 36])]; + tensor var_4495_end_mask_0 = const()[name = tensor("op_4495_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4495_cast_fp16 = slice_by_index(begin = var_4495_begin_0, end = var_4495_end_0, end_mask = var_4495_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4495_cast_fp16")]; + tensor var_4499_begin_0 = const()[name = tensor("op_4499_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_4499_end_0 = const()[name = tensor("op_4499_end_0"), val = tensor([2, 256, 1, 36])]; + tensor var_4499_end_mask_0 = const()[name = tensor("op_4499_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4499_cast_fp16 = slice_by_index(begin = var_4499_begin_0, end = var_4499_end_0, end_mask = var_4499_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4499_cast_fp16")]; + tensor var_4503_begin_0 = const()[name = tensor("op_4503_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_4503_end_0 = const()[name = tensor("op_4503_end_0"), val = tensor([2, 320, 1, 36])]; + tensor var_4503_end_mask_0 = const()[name = tensor("op_4503_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4503_cast_fp16 = slice_by_index(begin = var_4503_begin_0, end = var_4503_end_0, end_mask = var_4503_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4503_cast_fp16")]; + tensor var_4507_begin_0 = const()[name = tensor("op_4507_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_4507_end_0 = const()[name = tensor("op_4507_end_0"), val = tensor([2, 384, 1, 36])]; + tensor var_4507_end_mask_0 = const()[name = tensor("op_4507_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4507_cast_fp16 = slice_by_index(begin = var_4507_begin_0, end = var_4507_end_0, end_mask = var_4507_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4507_cast_fp16")]; + tensor var_4511_begin_0 = const()[name = tensor("op_4511_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_4511_end_0 = const()[name = tensor("op_4511_end_0"), val = tensor([2, 448, 1, 36])]; + tensor var_4511_end_mask_0 = const()[name = tensor("op_4511_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4511_cast_fp16 = slice_by_index(begin = var_4511_begin_0, end = var_4511_end_0, end_mask = var_4511_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4511_cast_fp16")]; + tensor var_4515_begin_0 = const()[name = tensor("op_4515_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_4515_end_0 = const()[name = tensor("op_4515_end_0"), val = tensor([2, 512, 1, 36])]; + tensor var_4515_end_mask_0 = const()[name = tensor("op_4515_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4515_cast_fp16 = slice_by_index(begin = var_4515_begin_0, end = var_4515_end_0, end_mask = var_4515_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4515_cast_fp16")]; + tensor var_4519_begin_0 = const()[name = tensor("op_4519_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_4519_end_0 = const()[name = tensor("op_4519_end_0"), val = tensor([2, 576, 1, 36])]; + tensor var_4519_end_mask_0 = const()[name = tensor("op_4519_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4519_cast_fp16 = slice_by_index(begin = var_4519_begin_0, end = var_4519_end_0, end_mask = var_4519_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4519_cast_fp16")]; + tensor var_4523_begin_0 = const()[name = tensor("op_4523_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_4523_end_0 = const()[name = tensor("op_4523_end_0"), val = tensor([2, 640, 1, 36])]; + tensor var_4523_end_mask_0 = const()[name = tensor("op_4523_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4523_cast_fp16 = slice_by_index(begin = var_4523_begin_0, end = var_4523_end_0, end_mask = var_4523_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4523_cast_fp16")]; + tensor var_4527_begin_0 = const()[name = tensor("op_4527_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_4527_end_0 = const()[name = tensor("op_4527_end_0"), val = tensor([2, 704, 1, 36])]; + tensor var_4527_end_mask_0 = const()[name = tensor("op_4527_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4527_cast_fp16 = slice_by_index(begin = var_4527_begin_0, end = var_4527_end_0, end_mask = var_4527_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4527_cast_fp16")]; + tensor var_4531_begin_0 = const()[name = tensor("op_4531_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_4531_end_0 = const()[name = tensor("op_4531_end_0"), val = tensor([2, 768, 1, 36])]; + tensor var_4531_end_mask_0 = const()[name = tensor("op_4531_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4531_cast_fp16 = slice_by_index(begin = var_4531_begin_0, end = var_4531_end_0, end_mask = var_4531_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4531_cast_fp16")]; + tensor var_4535_begin_0 = const()[name = tensor("op_4535_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_4535_end_0 = const()[name = tensor("op_4535_end_0"), val = tensor([2, 832, 1, 36])]; + tensor var_4535_end_mask_0 = const()[name = tensor("op_4535_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4535_cast_fp16 = slice_by_index(begin = var_4535_begin_0, end = var_4535_end_0, end_mask = var_4535_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4535_cast_fp16")]; + tensor var_4539_begin_0 = const()[name = tensor("op_4539_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_4539_end_0 = const()[name = tensor("op_4539_end_0"), val = tensor([2, 896, 1, 36])]; + tensor var_4539_end_mask_0 = const()[name = tensor("op_4539_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4539_cast_fp16 = slice_by_index(begin = var_4539_begin_0, end = var_4539_end_0, end_mask = var_4539_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4539_cast_fp16")]; + tensor var_4543_begin_0 = const()[name = tensor("op_4543_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_4543_end_0 = const()[name = tensor("op_4543_end_0"), val = tensor([2, 960, 1, 36])]; + tensor var_4543_end_mask_0 = const()[name = tensor("op_4543_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4543_cast_fp16 = slice_by_index(begin = var_4543_begin_0, end = var_4543_end_0, end_mask = var_4543_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4543_cast_fp16")]; + tensor var_4547_begin_0 = const()[name = tensor("op_4547_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_4547_end_0 = const()[name = tensor("op_4547_end_0"), val = tensor([2, 1024, 1, 36])]; + tensor var_4547_end_mask_0 = const()[name = tensor("op_4547_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4547_cast_fp16 = slice_by_index(begin = var_4547_begin_0, end = var_4547_end_0, end_mask = var_4547_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4547_cast_fp16")]; + tensor var_4551_begin_0 = const()[name = tensor("op_4551_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_4551_end_0 = const()[name = tensor("op_4551_end_0"), val = tensor([2, 1088, 1, 36])]; + tensor var_4551_end_mask_0 = const()[name = tensor("op_4551_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4551_cast_fp16 = slice_by_index(begin = var_4551_begin_0, end = var_4551_end_0, end_mask = var_4551_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4551_cast_fp16")]; + tensor var_4555_begin_0 = const()[name = tensor("op_4555_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_4555_end_0 = const()[name = tensor("op_4555_end_0"), val = tensor([2, 1152, 1, 36])]; + tensor var_4555_end_mask_0 = const()[name = tensor("op_4555_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4555_cast_fp16 = slice_by_index(begin = var_4555_begin_0, end = var_4555_end_0, end_mask = var_4555_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4555_cast_fp16")]; + tensor var_4559_begin_0 = const()[name = tensor("op_4559_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_4559_end_0 = const()[name = tensor("op_4559_end_0"), val = tensor([2, 1216, 1, 36])]; + tensor var_4559_end_mask_0 = const()[name = tensor("op_4559_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4559_cast_fp16 = slice_by_index(begin = var_4559_begin_0, end = var_4559_end_0, end_mask = var_4559_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4559_cast_fp16")]; + tensor var_4563_begin_0 = const()[name = tensor("op_4563_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_4563_end_0 = const()[name = tensor("op_4563_end_0"), val = tensor([2, 1280, 1, 36])]; + tensor var_4563_end_mask_0 = const()[name = tensor("op_4563_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4563_cast_fp16 = slice_by_index(begin = var_4563_begin_0, end = var_4563_end_0, end_mask = var_4563_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4563_cast_fp16")]; + tensor k_51_perm_0 = const()[name = tensor("k_51_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_4570_begin_0 = const()[name = tensor("op_4570_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_4570_end_0 = const()[name = tensor("op_4570_end_0"), val = tensor([2, 36, 1, 64])]; + tensor var_4570_end_mask_0 = const()[name = tensor("op_4570_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_19 = transpose(perm = k_51_perm_0, x = k_49_cast_fp16)[name = tensor("transpose_19")]; + tensor var_4570_cast_fp16 = slice_by_index(begin = var_4570_begin_0, end = var_4570_end_0, end_mask = var_4570_end_mask_0, x = transpose_19)[name = tensor("op_4570_cast_fp16")]; + tensor var_4574_begin_0 = const()[name = tensor("op_4574_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_4574_end_0 = const()[name = tensor("op_4574_end_0"), val = tensor([2, 36, 1, 128])]; + tensor var_4574_end_mask_0 = const()[name = tensor("op_4574_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4574_cast_fp16 = slice_by_index(begin = var_4574_begin_0, end = var_4574_end_0, end_mask = var_4574_end_mask_0, x = transpose_19)[name = tensor("op_4574_cast_fp16")]; + tensor var_4578_begin_0 = const()[name = tensor("op_4578_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_4578_end_0 = const()[name = tensor("op_4578_end_0"), val = tensor([2, 36, 1, 192])]; + tensor var_4578_end_mask_0 = const()[name = tensor("op_4578_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4578_cast_fp16 = slice_by_index(begin = var_4578_begin_0, end = var_4578_end_0, end_mask = var_4578_end_mask_0, x = transpose_19)[name = tensor("op_4578_cast_fp16")]; + tensor var_4582_begin_0 = const()[name = tensor("op_4582_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_4582_end_0 = const()[name = tensor("op_4582_end_0"), val = tensor([2, 36, 1, 256])]; + tensor var_4582_end_mask_0 = const()[name = tensor("op_4582_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4582_cast_fp16 = slice_by_index(begin = var_4582_begin_0, end = var_4582_end_0, end_mask = var_4582_end_mask_0, x = transpose_19)[name = tensor("op_4582_cast_fp16")]; + tensor var_4586_begin_0 = const()[name = tensor("op_4586_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_4586_end_0 = const()[name = tensor("op_4586_end_0"), val = tensor([2, 36, 1, 320])]; + tensor var_4586_end_mask_0 = const()[name = tensor("op_4586_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4586_cast_fp16 = slice_by_index(begin = var_4586_begin_0, end = var_4586_end_0, end_mask = var_4586_end_mask_0, x = transpose_19)[name = tensor("op_4586_cast_fp16")]; + tensor var_4590_begin_0 = const()[name = tensor("op_4590_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_4590_end_0 = const()[name = tensor("op_4590_end_0"), val = tensor([2, 36, 1, 384])]; + tensor var_4590_end_mask_0 = const()[name = tensor("op_4590_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4590_cast_fp16 = slice_by_index(begin = var_4590_begin_0, end = var_4590_end_0, end_mask = var_4590_end_mask_0, x = transpose_19)[name = tensor("op_4590_cast_fp16")]; + tensor var_4594_begin_0 = const()[name = tensor("op_4594_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_4594_end_0 = const()[name = tensor("op_4594_end_0"), val = tensor([2, 36, 1, 448])]; + tensor var_4594_end_mask_0 = const()[name = tensor("op_4594_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4594_cast_fp16 = slice_by_index(begin = var_4594_begin_0, end = var_4594_end_0, end_mask = var_4594_end_mask_0, x = transpose_19)[name = tensor("op_4594_cast_fp16")]; + tensor var_4598_begin_0 = const()[name = tensor("op_4598_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_4598_end_0 = const()[name = tensor("op_4598_end_0"), val = tensor([2, 36, 1, 512])]; + tensor var_4598_end_mask_0 = const()[name = tensor("op_4598_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4598_cast_fp16 = slice_by_index(begin = var_4598_begin_0, end = var_4598_end_0, end_mask = var_4598_end_mask_0, x = transpose_19)[name = tensor("op_4598_cast_fp16")]; + tensor var_4602_begin_0 = const()[name = tensor("op_4602_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_4602_end_0 = const()[name = tensor("op_4602_end_0"), val = tensor([2, 36, 1, 576])]; + tensor var_4602_end_mask_0 = const()[name = tensor("op_4602_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4602_cast_fp16 = slice_by_index(begin = var_4602_begin_0, end = var_4602_end_0, end_mask = var_4602_end_mask_0, x = transpose_19)[name = tensor("op_4602_cast_fp16")]; + tensor var_4606_begin_0 = const()[name = tensor("op_4606_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_4606_end_0 = const()[name = tensor("op_4606_end_0"), val = tensor([2, 36, 1, 640])]; + tensor var_4606_end_mask_0 = const()[name = tensor("op_4606_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4606_cast_fp16 = slice_by_index(begin = var_4606_begin_0, end = var_4606_end_0, end_mask = var_4606_end_mask_0, x = transpose_19)[name = tensor("op_4606_cast_fp16")]; + tensor var_4610_begin_0 = const()[name = tensor("op_4610_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_4610_end_0 = const()[name = tensor("op_4610_end_0"), val = tensor([2, 36, 1, 704])]; + tensor var_4610_end_mask_0 = const()[name = tensor("op_4610_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4610_cast_fp16 = slice_by_index(begin = var_4610_begin_0, end = var_4610_end_0, end_mask = var_4610_end_mask_0, x = transpose_19)[name = tensor("op_4610_cast_fp16")]; + tensor var_4614_begin_0 = const()[name = tensor("op_4614_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_4614_end_0 = const()[name = tensor("op_4614_end_0"), val = tensor([2, 36, 1, 768])]; + tensor var_4614_end_mask_0 = const()[name = tensor("op_4614_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4614_cast_fp16 = slice_by_index(begin = var_4614_begin_0, end = var_4614_end_0, end_mask = var_4614_end_mask_0, x = transpose_19)[name = tensor("op_4614_cast_fp16")]; + tensor var_4618_begin_0 = const()[name = tensor("op_4618_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_4618_end_0 = const()[name = tensor("op_4618_end_0"), val = tensor([2, 36, 1, 832])]; + tensor var_4618_end_mask_0 = const()[name = tensor("op_4618_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4618_cast_fp16 = slice_by_index(begin = var_4618_begin_0, end = var_4618_end_0, end_mask = var_4618_end_mask_0, x = transpose_19)[name = tensor("op_4618_cast_fp16")]; + tensor var_4622_begin_0 = const()[name = tensor("op_4622_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_4622_end_0 = const()[name = tensor("op_4622_end_0"), val = tensor([2, 36, 1, 896])]; + tensor var_4622_end_mask_0 = const()[name = tensor("op_4622_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4622_cast_fp16 = slice_by_index(begin = var_4622_begin_0, end = var_4622_end_0, end_mask = var_4622_end_mask_0, x = transpose_19)[name = tensor("op_4622_cast_fp16")]; + tensor var_4626_begin_0 = const()[name = tensor("op_4626_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_4626_end_0 = const()[name = tensor("op_4626_end_0"), val = tensor([2, 36, 1, 960])]; + tensor var_4626_end_mask_0 = const()[name = tensor("op_4626_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4626_cast_fp16 = slice_by_index(begin = var_4626_begin_0, end = var_4626_end_0, end_mask = var_4626_end_mask_0, x = transpose_19)[name = tensor("op_4626_cast_fp16")]; + tensor var_4630_begin_0 = const()[name = tensor("op_4630_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_4630_end_0 = const()[name = tensor("op_4630_end_0"), val = tensor([2, 36, 1, 1024])]; + tensor var_4630_end_mask_0 = const()[name = tensor("op_4630_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4630_cast_fp16 = slice_by_index(begin = var_4630_begin_0, end = var_4630_end_0, end_mask = var_4630_end_mask_0, x = transpose_19)[name = tensor("op_4630_cast_fp16")]; + tensor var_4634_begin_0 = const()[name = tensor("op_4634_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_4634_end_0 = const()[name = tensor("op_4634_end_0"), val = tensor([2, 36, 1, 1088])]; + tensor var_4634_end_mask_0 = const()[name = tensor("op_4634_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4634_cast_fp16 = slice_by_index(begin = var_4634_begin_0, end = var_4634_end_0, end_mask = var_4634_end_mask_0, x = transpose_19)[name = tensor("op_4634_cast_fp16")]; + tensor var_4638_begin_0 = const()[name = tensor("op_4638_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_4638_end_0 = const()[name = tensor("op_4638_end_0"), val = tensor([2, 36, 1, 1152])]; + tensor var_4638_end_mask_0 = const()[name = tensor("op_4638_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4638_cast_fp16 = slice_by_index(begin = var_4638_begin_0, end = var_4638_end_0, end_mask = var_4638_end_mask_0, x = transpose_19)[name = tensor("op_4638_cast_fp16")]; + tensor var_4642_begin_0 = const()[name = tensor("op_4642_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_4642_end_0 = const()[name = tensor("op_4642_end_0"), val = tensor([2, 36, 1, 1216])]; + tensor var_4642_end_mask_0 = const()[name = tensor("op_4642_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4642_cast_fp16 = slice_by_index(begin = var_4642_begin_0, end = var_4642_end_0, end_mask = var_4642_end_mask_0, x = transpose_19)[name = tensor("op_4642_cast_fp16")]; + tensor var_4646_begin_0 = const()[name = tensor("op_4646_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_4646_end_0 = const()[name = tensor("op_4646_end_0"), val = tensor([2, 36, 1, 1280])]; + tensor var_4646_end_mask_0 = const()[name = tensor("op_4646_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_4646_cast_fp16 = slice_by_index(begin = var_4646_begin_0, end = var_4646_end_0, end_mask = var_4646_end_mask_0, x = transpose_19)[name = tensor("op_4646_cast_fp16")]; + tensor var_4648_begin_0 = const()[name = tensor("op_4648_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_4648_end_0 = const()[name = tensor("op_4648_end_0"), val = tensor([2, 64, 1, 36])]; + tensor var_4648_end_mask_0 = const()[name = tensor("op_4648_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4648_cast_fp16 = slice_by_index(begin = var_4648_begin_0, end = var_4648_end_0, end_mask = var_4648_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4648_cast_fp16")]; + tensor var_4652_begin_0 = const()[name = tensor("op_4652_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_4652_end_0 = const()[name = tensor("op_4652_end_0"), val = tensor([2, 128, 1, 36])]; + tensor var_4652_end_mask_0 = const()[name = tensor("op_4652_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4652_cast_fp16 = slice_by_index(begin = var_4652_begin_0, end = var_4652_end_0, end_mask = var_4652_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4652_cast_fp16")]; + tensor var_4656_begin_0 = const()[name = tensor("op_4656_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_4656_end_0 = const()[name = tensor("op_4656_end_0"), val = tensor([2, 192, 1, 36])]; + tensor var_4656_end_mask_0 = const()[name = tensor("op_4656_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4656_cast_fp16 = slice_by_index(begin = var_4656_begin_0, end = var_4656_end_0, end_mask = var_4656_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4656_cast_fp16")]; + tensor var_4660_begin_0 = const()[name = tensor("op_4660_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_4660_end_0 = const()[name = tensor("op_4660_end_0"), val = tensor([2, 256, 1, 36])]; + tensor var_4660_end_mask_0 = const()[name = tensor("op_4660_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4660_cast_fp16 = slice_by_index(begin = var_4660_begin_0, end = var_4660_end_0, end_mask = var_4660_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4660_cast_fp16")]; + tensor var_4664_begin_0 = const()[name = tensor("op_4664_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_4664_end_0 = const()[name = tensor("op_4664_end_0"), val = tensor([2, 320, 1, 36])]; + tensor var_4664_end_mask_0 = const()[name = tensor("op_4664_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4664_cast_fp16 = slice_by_index(begin = var_4664_begin_0, end = var_4664_end_0, end_mask = var_4664_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4664_cast_fp16")]; + tensor var_4668_begin_0 = const()[name = tensor("op_4668_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_4668_end_0 = const()[name = tensor("op_4668_end_0"), val = tensor([2, 384, 1, 36])]; + tensor var_4668_end_mask_0 = const()[name = tensor("op_4668_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4668_cast_fp16 = slice_by_index(begin = var_4668_begin_0, end = var_4668_end_0, end_mask = var_4668_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4668_cast_fp16")]; + tensor var_4672_begin_0 = const()[name = tensor("op_4672_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_4672_end_0 = const()[name = tensor("op_4672_end_0"), val = tensor([2, 448, 1, 36])]; + tensor var_4672_end_mask_0 = const()[name = tensor("op_4672_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4672_cast_fp16 = slice_by_index(begin = var_4672_begin_0, end = var_4672_end_0, end_mask = var_4672_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4672_cast_fp16")]; + tensor var_4676_begin_0 = const()[name = tensor("op_4676_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_4676_end_0 = const()[name = tensor("op_4676_end_0"), val = tensor([2, 512, 1, 36])]; + tensor var_4676_end_mask_0 = const()[name = tensor("op_4676_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4676_cast_fp16 = slice_by_index(begin = var_4676_begin_0, end = var_4676_end_0, end_mask = var_4676_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4676_cast_fp16")]; + tensor var_4680_begin_0 = const()[name = tensor("op_4680_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_4680_end_0 = const()[name = tensor("op_4680_end_0"), val = tensor([2, 576, 1, 36])]; + tensor var_4680_end_mask_0 = const()[name = tensor("op_4680_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4680_cast_fp16 = slice_by_index(begin = var_4680_begin_0, end = var_4680_end_0, end_mask = var_4680_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4680_cast_fp16")]; + tensor var_4684_begin_0 = const()[name = tensor("op_4684_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_4684_end_0 = const()[name = tensor("op_4684_end_0"), val = tensor([2, 640, 1, 36])]; + tensor var_4684_end_mask_0 = const()[name = tensor("op_4684_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4684_cast_fp16 = slice_by_index(begin = var_4684_begin_0, end = var_4684_end_0, end_mask = var_4684_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4684_cast_fp16")]; + tensor var_4688_begin_0 = const()[name = tensor("op_4688_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_4688_end_0 = const()[name = tensor("op_4688_end_0"), val = tensor([2, 704, 1, 36])]; + tensor var_4688_end_mask_0 = const()[name = tensor("op_4688_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4688_cast_fp16 = slice_by_index(begin = var_4688_begin_0, end = var_4688_end_0, end_mask = var_4688_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4688_cast_fp16")]; + tensor var_4692_begin_0 = const()[name = tensor("op_4692_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_4692_end_0 = const()[name = tensor("op_4692_end_0"), val = tensor([2, 768, 1, 36])]; + tensor var_4692_end_mask_0 = const()[name = tensor("op_4692_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4692_cast_fp16 = slice_by_index(begin = var_4692_begin_0, end = var_4692_end_0, end_mask = var_4692_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4692_cast_fp16")]; + tensor var_4696_begin_0 = const()[name = tensor("op_4696_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_4696_end_0 = const()[name = tensor("op_4696_end_0"), val = tensor([2, 832, 1, 36])]; + tensor var_4696_end_mask_0 = const()[name = tensor("op_4696_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4696_cast_fp16 = slice_by_index(begin = var_4696_begin_0, end = var_4696_end_0, end_mask = var_4696_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4696_cast_fp16")]; + tensor var_4700_begin_0 = const()[name = tensor("op_4700_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_4700_end_0 = const()[name = tensor("op_4700_end_0"), val = tensor([2, 896, 1, 36])]; + tensor var_4700_end_mask_0 = const()[name = tensor("op_4700_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4700_cast_fp16 = slice_by_index(begin = var_4700_begin_0, end = var_4700_end_0, end_mask = var_4700_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4700_cast_fp16")]; + tensor var_4704_begin_0 = const()[name = tensor("op_4704_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_4704_end_0 = const()[name = tensor("op_4704_end_0"), val = tensor([2, 960, 1, 36])]; + tensor var_4704_end_mask_0 = const()[name = tensor("op_4704_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4704_cast_fp16 = slice_by_index(begin = var_4704_begin_0, end = var_4704_end_0, end_mask = var_4704_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4704_cast_fp16")]; + tensor var_4708_begin_0 = const()[name = tensor("op_4708_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_4708_end_0 = const()[name = tensor("op_4708_end_0"), val = tensor([2, 1024, 1, 36])]; + tensor var_4708_end_mask_0 = const()[name = tensor("op_4708_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4708_cast_fp16 = slice_by_index(begin = var_4708_begin_0, end = var_4708_end_0, end_mask = var_4708_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4708_cast_fp16")]; + tensor var_4712_begin_0 = const()[name = tensor("op_4712_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_4712_end_0 = const()[name = tensor("op_4712_end_0"), val = tensor([2, 1088, 1, 36])]; + tensor var_4712_end_mask_0 = const()[name = tensor("op_4712_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4712_cast_fp16 = slice_by_index(begin = var_4712_begin_0, end = var_4712_end_0, end_mask = var_4712_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4712_cast_fp16")]; + tensor var_4716_begin_0 = const()[name = tensor("op_4716_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_4716_end_0 = const()[name = tensor("op_4716_end_0"), val = tensor([2, 1152, 1, 36])]; + tensor var_4716_end_mask_0 = const()[name = tensor("op_4716_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4716_cast_fp16 = slice_by_index(begin = var_4716_begin_0, end = var_4716_end_0, end_mask = var_4716_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4716_cast_fp16")]; + tensor var_4720_begin_0 = const()[name = tensor("op_4720_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_4720_end_0 = const()[name = tensor("op_4720_end_0"), val = tensor([2, 1216, 1, 36])]; + tensor var_4720_end_mask_0 = const()[name = tensor("op_4720_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4720_cast_fp16 = slice_by_index(begin = var_4720_begin_0, end = var_4720_end_0, end_mask = var_4720_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4720_cast_fp16")]; + tensor var_4724_begin_0 = const()[name = tensor("op_4724_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_4724_end_0 = const()[name = tensor("op_4724_end_0"), val = tensor([2, 1280, 1, 36])]; + tensor var_4724_end_mask_0 = const()[name = tensor("op_4724_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4724_cast_fp16 = slice_by_index(begin = var_4724_begin_0, end = var_4724_end_0, end_mask = var_4724_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4724_cast_fp16")]; + tensor var_4728_equation_0 = const()[name = tensor("op_4728_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4728_cast_fp16 = einsum(equation = var_4728_equation_0, values = (var_4570_cast_fp16, var_4487_cast_fp16))[name = tensor("op_4728_cast_fp16")]; + tensor var_4729_to_fp16 = const()[name = tensor("op_4729_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_281_cast_fp16 = mul(x = var_4728_cast_fp16, y = var_4729_to_fp16)[name = tensor("aw_281_cast_fp16")]; + tensor var_4732_equation_0 = const()[name = tensor("op_4732_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4732_cast_fp16 = einsum(equation = var_4732_equation_0, values = (var_4574_cast_fp16, var_4491_cast_fp16))[name = tensor("op_4732_cast_fp16")]; + tensor var_4733_to_fp16 = const()[name = tensor("op_4733_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_283_cast_fp16 = mul(x = var_4732_cast_fp16, y = var_4733_to_fp16)[name = tensor("aw_283_cast_fp16")]; + tensor var_4736_equation_0 = const()[name = tensor("op_4736_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4736_cast_fp16 = einsum(equation = var_4736_equation_0, values = (var_4578_cast_fp16, var_4495_cast_fp16))[name = tensor("op_4736_cast_fp16")]; + tensor var_4737_to_fp16 = const()[name = tensor("op_4737_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_285_cast_fp16 = mul(x = var_4736_cast_fp16, y = var_4737_to_fp16)[name = tensor("aw_285_cast_fp16")]; + tensor var_4740_equation_0 = const()[name = tensor("op_4740_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4740_cast_fp16 = einsum(equation = var_4740_equation_0, values = (var_4582_cast_fp16, var_4499_cast_fp16))[name = tensor("op_4740_cast_fp16")]; + tensor var_4741_to_fp16 = const()[name = tensor("op_4741_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_287_cast_fp16 = mul(x = var_4740_cast_fp16, y = var_4741_to_fp16)[name = tensor("aw_287_cast_fp16")]; + tensor var_4744_equation_0 = const()[name = tensor("op_4744_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4744_cast_fp16 = einsum(equation = var_4744_equation_0, values = (var_4586_cast_fp16, var_4503_cast_fp16))[name = tensor("op_4744_cast_fp16")]; + tensor var_4745_to_fp16 = const()[name = tensor("op_4745_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_289_cast_fp16 = mul(x = var_4744_cast_fp16, y = var_4745_to_fp16)[name = tensor("aw_289_cast_fp16")]; + tensor var_4748_equation_0 = const()[name = tensor("op_4748_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4748_cast_fp16 = einsum(equation = var_4748_equation_0, values = (var_4590_cast_fp16, var_4507_cast_fp16))[name = tensor("op_4748_cast_fp16")]; + tensor var_4749_to_fp16 = const()[name = tensor("op_4749_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_291_cast_fp16 = mul(x = var_4748_cast_fp16, y = var_4749_to_fp16)[name = tensor("aw_291_cast_fp16")]; + tensor var_4752_equation_0 = const()[name = tensor("op_4752_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4752_cast_fp16 = einsum(equation = var_4752_equation_0, values = (var_4594_cast_fp16, var_4511_cast_fp16))[name = tensor("op_4752_cast_fp16")]; + tensor var_4753_to_fp16 = const()[name = tensor("op_4753_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_293_cast_fp16 = mul(x = var_4752_cast_fp16, y = var_4753_to_fp16)[name = tensor("aw_293_cast_fp16")]; + tensor var_4756_equation_0 = const()[name = tensor("op_4756_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4756_cast_fp16 = einsum(equation = var_4756_equation_0, values = (var_4598_cast_fp16, var_4515_cast_fp16))[name = tensor("op_4756_cast_fp16")]; + tensor var_4757_to_fp16 = const()[name = tensor("op_4757_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_295_cast_fp16 = mul(x = var_4756_cast_fp16, y = var_4757_to_fp16)[name = tensor("aw_295_cast_fp16")]; + tensor var_4760_equation_0 = const()[name = tensor("op_4760_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4760_cast_fp16 = einsum(equation = var_4760_equation_0, values = (var_4602_cast_fp16, var_4519_cast_fp16))[name = tensor("op_4760_cast_fp16")]; + tensor var_4761_to_fp16 = const()[name = tensor("op_4761_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_297_cast_fp16 = mul(x = var_4760_cast_fp16, y = var_4761_to_fp16)[name = tensor("aw_297_cast_fp16")]; + tensor var_4764_equation_0 = const()[name = tensor("op_4764_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4764_cast_fp16 = einsum(equation = var_4764_equation_0, values = (var_4606_cast_fp16, var_4523_cast_fp16))[name = tensor("op_4764_cast_fp16")]; + tensor var_4765_to_fp16 = const()[name = tensor("op_4765_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_299_cast_fp16 = mul(x = var_4764_cast_fp16, y = var_4765_to_fp16)[name = tensor("aw_299_cast_fp16")]; + tensor var_4768_equation_0 = const()[name = tensor("op_4768_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4768_cast_fp16 = einsum(equation = var_4768_equation_0, values = (var_4610_cast_fp16, var_4527_cast_fp16))[name = tensor("op_4768_cast_fp16")]; + tensor var_4769_to_fp16 = const()[name = tensor("op_4769_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_301_cast_fp16 = mul(x = var_4768_cast_fp16, y = var_4769_to_fp16)[name = tensor("aw_301_cast_fp16")]; + tensor var_4772_equation_0 = const()[name = tensor("op_4772_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4772_cast_fp16 = einsum(equation = var_4772_equation_0, values = (var_4614_cast_fp16, var_4531_cast_fp16))[name = tensor("op_4772_cast_fp16")]; + tensor var_4773_to_fp16 = const()[name = tensor("op_4773_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_303_cast_fp16 = mul(x = var_4772_cast_fp16, y = var_4773_to_fp16)[name = tensor("aw_303_cast_fp16")]; + tensor var_4776_equation_0 = const()[name = tensor("op_4776_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4776_cast_fp16 = einsum(equation = var_4776_equation_0, values = (var_4618_cast_fp16, var_4535_cast_fp16))[name = tensor("op_4776_cast_fp16")]; + tensor var_4777_to_fp16 = const()[name = tensor("op_4777_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_305_cast_fp16 = mul(x = var_4776_cast_fp16, y = var_4777_to_fp16)[name = tensor("aw_305_cast_fp16")]; + tensor var_4780_equation_0 = const()[name = tensor("op_4780_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4780_cast_fp16 = einsum(equation = var_4780_equation_0, values = (var_4622_cast_fp16, var_4539_cast_fp16))[name = tensor("op_4780_cast_fp16")]; + tensor var_4781_to_fp16 = const()[name = tensor("op_4781_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_307_cast_fp16 = mul(x = var_4780_cast_fp16, y = var_4781_to_fp16)[name = tensor("aw_307_cast_fp16")]; + tensor var_4784_equation_0 = const()[name = tensor("op_4784_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4784_cast_fp16 = einsum(equation = var_4784_equation_0, values = (var_4626_cast_fp16, var_4543_cast_fp16))[name = tensor("op_4784_cast_fp16")]; + tensor var_4785_to_fp16 = const()[name = tensor("op_4785_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_309_cast_fp16 = mul(x = var_4784_cast_fp16, y = var_4785_to_fp16)[name = tensor("aw_309_cast_fp16")]; + tensor var_4788_equation_0 = const()[name = tensor("op_4788_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4788_cast_fp16 = einsum(equation = var_4788_equation_0, values = (var_4630_cast_fp16, var_4547_cast_fp16))[name = tensor("op_4788_cast_fp16")]; + tensor var_4789_to_fp16 = const()[name = tensor("op_4789_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_311_cast_fp16 = mul(x = var_4788_cast_fp16, y = var_4789_to_fp16)[name = tensor("aw_311_cast_fp16")]; + tensor var_4792_equation_0 = const()[name = tensor("op_4792_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4792_cast_fp16 = einsum(equation = var_4792_equation_0, values = (var_4634_cast_fp16, var_4551_cast_fp16))[name = tensor("op_4792_cast_fp16")]; + tensor var_4793_to_fp16 = const()[name = tensor("op_4793_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_313_cast_fp16 = mul(x = var_4792_cast_fp16, y = var_4793_to_fp16)[name = tensor("aw_313_cast_fp16")]; + tensor var_4796_equation_0 = const()[name = tensor("op_4796_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4796_cast_fp16 = einsum(equation = var_4796_equation_0, values = (var_4638_cast_fp16, var_4555_cast_fp16))[name = tensor("op_4796_cast_fp16")]; + tensor var_4797_to_fp16 = const()[name = tensor("op_4797_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_315_cast_fp16 = mul(x = var_4796_cast_fp16, y = var_4797_to_fp16)[name = tensor("aw_315_cast_fp16")]; + tensor var_4800_equation_0 = const()[name = tensor("op_4800_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4800_cast_fp16 = einsum(equation = var_4800_equation_0, values = (var_4642_cast_fp16, var_4559_cast_fp16))[name = tensor("op_4800_cast_fp16")]; + tensor var_4801_to_fp16 = const()[name = tensor("op_4801_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_317_cast_fp16 = mul(x = var_4800_cast_fp16, y = var_4801_to_fp16)[name = tensor("aw_317_cast_fp16")]; + tensor var_4804_equation_0 = const()[name = tensor("op_4804_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_4804_cast_fp16 = einsum(equation = var_4804_equation_0, values = (var_4646_cast_fp16, var_4563_cast_fp16))[name = tensor("op_4804_cast_fp16")]; + tensor var_4805_to_fp16 = const()[name = tensor("op_4805_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_319_cast_fp16 = mul(x = var_4804_cast_fp16, y = var_4805_to_fp16)[name = tensor("aw_319_cast_fp16")]; + tensor var_4807_cast_fp16 = softmax(axis = var_4371, x = aw_281_cast_fp16)[name = tensor("op_4807_cast_fp16")]; + tensor var_4808_cast_fp16 = softmax(axis = var_4371, x = aw_283_cast_fp16)[name = tensor("op_4808_cast_fp16")]; + tensor var_4809_cast_fp16 = softmax(axis = var_4371, x = aw_285_cast_fp16)[name = tensor("op_4809_cast_fp16")]; + tensor var_4810_cast_fp16 = softmax(axis = var_4371, x = aw_287_cast_fp16)[name = tensor("op_4810_cast_fp16")]; + tensor var_4811_cast_fp16 = softmax(axis = var_4371, x = aw_289_cast_fp16)[name = tensor("op_4811_cast_fp16")]; + tensor var_4812_cast_fp16 = softmax(axis = var_4371, x = aw_291_cast_fp16)[name = tensor("op_4812_cast_fp16")]; + tensor var_4813_cast_fp16 = softmax(axis = var_4371, x = aw_293_cast_fp16)[name = tensor("op_4813_cast_fp16")]; + tensor var_4814_cast_fp16 = softmax(axis = var_4371, x = aw_295_cast_fp16)[name = tensor("op_4814_cast_fp16")]; + tensor var_4815_cast_fp16 = softmax(axis = var_4371, x = aw_297_cast_fp16)[name = tensor("op_4815_cast_fp16")]; + tensor var_4816_cast_fp16 = softmax(axis = var_4371, x = aw_299_cast_fp16)[name = tensor("op_4816_cast_fp16")]; + tensor var_4817_cast_fp16 = softmax(axis = var_4371, x = aw_301_cast_fp16)[name = tensor("op_4817_cast_fp16")]; + tensor var_4818_cast_fp16 = softmax(axis = var_4371, x = aw_303_cast_fp16)[name = tensor("op_4818_cast_fp16")]; + tensor var_4819_cast_fp16 = softmax(axis = var_4371, x = aw_305_cast_fp16)[name = tensor("op_4819_cast_fp16")]; + tensor var_4820_cast_fp16 = softmax(axis = var_4371, x = aw_307_cast_fp16)[name = tensor("op_4820_cast_fp16")]; + tensor var_4821_cast_fp16 = softmax(axis = var_4371, x = aw_309_cast_fp16)[name = tensor("op_4821_cast_fp16")]; + tensor var_4822_cast_fp16 = softmax(axis = var_4371, x = aw_311_cast_fp16)[name = tensor("op_4822_cast_fp16")]; + tensor var_4823_cast_fp16 = softmax(axis = var_4371, x = aw_313_cast_fp16)[name = tensor("op_4823_cast_fp16")]; + tensor var_4824_cast_fp16 = softmax(axis = var_4371, x = aw_315_cast_fp16)[name = tensor("op_4824_cast_fp16")]; + tensor var_4825_cast_fp16 = softmax(axis = var_4371, x = aw_317_cast_fp16)[name = tensor("op_4825_cast_fp16")]; + tensor var_4826_cast_fp16 = softmax(axis = var_4371, x = aw_319_cast_fp16)[name = tensor("op_4826_cast_fp16")]; + tensor var_4828_equation_0 = const()[name = tensor("op_4828_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4828_cast_fp16 = einsum(equation = var_4828_equation_0, values = (var_4648_cast_fp16, var_4807_cast_fp16))[name = tensor("op_4828_cast_fp16")]; + tensor var_4830_equation_0 = const()[name = tensor("op_4830_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4830_cast_fp16 = einsum(equation = var_4830_equation_0, values = (var_4652_cast_fp16, var_4808_cast_fp16))[name = tensor("op_4830_cast_fp16")]; + tensor var_4832_equation_0 = const()[name = tensor("op_4832_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4832_cast_fp16 = einsum(equation = var_4832_equation_0, values = (var_4656_cast_fp16, var_4809_cast_fp16))[name = tensor("op_4832_cast_fp16")]; + tensor var_4834_equation_0 = const()[name = tensor("op_4834_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4834_cast_fp16 = einsum(equation = var_4834_equation_0, values = (var_4660_cast_fp16, var_4810_cast_fp16))[name = tensor("op_4834_cast_fp16")]; + tensor var_4836_equation_0 = const()[name = tensor("op_4836_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4836_cast_fp16 = einsum(equation = var_4836_equation_0, values = (var_4664_cast_fp16, var_4811_cast_fp16))[name = tensor("op_4836_cast_fp16")]; + tensor var_4838_equation_0 = const()[name = tensor("op_4838_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4838_cast_fp16 = einsum(equation = var_4838_equation_0, values = (var_4668_cast_fp16, var_4812_cast_fp16))[name = tensor("op_4838_cast_fp16")]; + tensor var_4840_equation_0 = const()[name = tensor("op_4840_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4840_cast_fp16 = einsum(equation = var_4840_equation_0, values = (var_4672_cast_fp16, var_4813_cast_fp16))[name = tensor("op_4840_cast_fp16")]; + tensor var_4842_equation_0 = const()[name = tensor("op_4842_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4842_cast_fp16 = einsum(equation = var_4842_equation_0, values = (var_4676_cast_fp16, var_4814_cast_fp16))[name = tensor("op_4842_cast_fp16")]; + tensor var_4844_equation_0 = const()[name = tensor("op_4844_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4844_cast_fp16 = einsum(equation = var_4844_equation_0, values = (var_4680_cast_fp16, var_4815_cast_fp16))[name = tensor("op_4844_cast_fp16")]; + tensor var_4846_equation_0 = const()[name = tensor("op_4846_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4846_cast_fp16 = einsum(equation = var_4846_equation_0, values = (var_4684_cast_fp16, var_4816_cast_fp16))[name = tensor("op_4846_cast_fp16")]; + tensor var_4848_equation_0 = const()[name = tensor("op_4848_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4848_cast_fp16 = einsum(equation = var_4848_equation_0, values = (var_4688_cast_fp16, var_4817_cast_fp16))[name = tensor("op_4848_cast_fp16")]; + tensor var_4850_equation_0 = const()[name = tensor("op_4850_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4850_cast_fp16 = einsum(equation = var_4850_equation_0, values = (var_4692_cast_fp16, var_4818_cast_fp16))[name = tensor("op_4850_cast_fp16")]; + tensor var_4852_equation_0 = const()[name = tensor("op_4852_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4852_cast_fp16 = einsum(equation = var_4852_equation_0, values = (var_4696_cast_fp16, var_4819_cast_fp16))[name = tensor("op_4852_cast_fp16")]; + tensor var_4854_equation_0 = const()[name = tensor("op_4854_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4854_cast_fp16 = einsum(equation = var_4854_equation_0, values = (var_4700_cast_fp16, var_4820_cast_fp16))[name = tensor("op_4854_cast_fp16")]; + tensor var_4856_equation_0 = const()[name = tensor("op_4856_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4856_cast_fp16 = einsum(equation = var_4856_equation_0, values = (var_4704_cast_fp16, var_4821_cast_fp16))[name = tensor("op_4856_cast_fp16")]; + tensor var_4858_equation_0 = const()[name = tensor("op_4858_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4858_cast_fp16 = einsum(equation = var_4858_equation_0, values = (var_4708_cast_fp16, var_4822_cast_fp16))[name = tensor("op_4858_cast_fp16")]; + tensor var_4860_equation_0 = const()[name = tensor("op_4860_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4860_cast_fp16 = einsum(equation = var_4860_equation_0, values = (var_4712_cast_fp16, var_4823_cast_fp16))[name = tensor("op_4860_cast_fp16")]; + tensor var_4862_equation_0 = const()[name = tensor("op_4862_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4862_cast_fp16 = einsum(equation = var_4862_equation_0, values = (var_4716_cast_fp16, var_4824_cast_fp16))[name = tensor("op_4862_cast_fp16")]; + tensor var_4864_equation_0 = const()[name = tensor("op_4864_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4864_cast_fp16 = einsum(equation = var_4864_equation_0, values = (var_4720_cast_fp16, var_4825_cast_fp16))[name = tensor("op_4864_cast_fp16")]; + tensor var_4866_equation_0 = const()[name = tensor("op_4866_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_4866_cast_fp16 = einsum(equation = var_4866_equation_0, values = (var_4724_cast_fp16, var_4826_cast_fp16))[name = tensor("op_4866_cast_fp16")]; + tensor input_215_interleave_0 = const()[name = tensor("input_215_interleave_0"), val = tensor(false)]; + tensor input_215_cast_fp16 = concat(axis = var_4371, interleave = input_215_interleave_0, values = (var_4828_cast_fp16, var_4830_cast_fp16, var_4832_cast_fp16, var_4834_cast_fp16, var_4836_cast_fp16, var_4838_cast_fp16, var_4840_cast_fp16, var_4842_cast_fp16, var_4844_cast_fp16, var_4846_cast_fp16, var_4848_cast_fp16, var_4850_cast_fp16, var_4852_cast_fp16, var_4854_cast_fp16, var_4856_cast_fp16, var_4858_cast_fp16, var_4860_cast_fp16, var_4862_cast_fp16, var_4864_cast_fp16, var_4866_cast_fp16))[name = tensor("input_215_cast_fp16")]; + tensor var_4872 = const()[name = tensor("op_4872"), val = tensor([1, 1])]; + tensor var_4874 = const()[name = tensor("op_4874"), val = tensor([1, 1])]; + tensor var_4876_pad_type_0 = const()[name = tensor("op_4876_pad_type_0"), val = tensor("custom")]; + tensor var_4876_pad_0 = const()[name = tensor("op_4876_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(583361536)))]; + tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586638400)))]; + tensor var_4876_cast_fp16 = conv(bias = mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_4874, groups = var_4371, pad = var_4876_pad_0, pad_type = var_4876_pad_type_0, strides = var_4872, weight = mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_215_cast_fp16)[name = tensor("op_4876_cast_fp16")]; + tensor inputs_39_cast_fp16 = add(x = var_4876_cast_fp16, y = inputs_37_cast_fp16)[name = tensor("inputs_39_cast_fp16")]; + tensor var_4880 = const()[name = tensor("op_4880"), val = tensor([1])]; + tensor channels_mean_39_cast_fp16 = reduce_mean(axes = var_4880, keep_dims = var_4366, x = inputs_39_cast_fp16)[name = tensor("channels_mean_39_cast_fp16")]; + tensor zero_mean_39_cast_fp16 = sub(x = inputs_39_cast_fp16, y = channels_mean_39_cast_fp16)[name = tensor("zero_mean_39_cast_fp16")]; + tensor zero_mean_sq_39_cast_fp16 = mul(x = zero_mean_39_cast_fp16, y = zero_mean_39_cast_fp16)[name = tensor("zero_mean_sq_39_cast_fp16")]; + tensor var_4884 = const()[name = tensor("op_4884"), val = tensor([1])]; + tensor var_4885_cast_fp16 = reduce_mean(axes = var_4884, keep_dims = var_4366, x = zero_mean_sq_39_cast_fp16)[name = tensor("op_4885_cast_fp16")]; + tensor var_4886_to_fp16 = const()[name = tensor("op_4886_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_4887_cast_fp16 = add(x = var_4885_cast_fp16, y = var_4886_to_fp16)[name = tensor("op_4887_cast_fp16")]; + tensor denom_39_epsilon_0_to_fp16 = const()[name = tensor("denom_39_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_39_cast_fp16 = rsqrt(epsilon = denom_39_epsilon_0_to_fp16, x = var_4887_cast_fp16)[name = tensor("denom_39_cast_fp16")]; + tensor out_39_cast_fp16 = mul(x = zero_mean_39_cast_fp16, y = denom_39_cast_fp16)[name = tensor("out_39_cast_fp16")]; + tensor var_4891_to_fp16 = const()[name = tensor("op_4891_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586641024)))]; + tensor var_4892_cast_fp16 = add(x = out_39_cast_fp16, y = var_4891_to_fp16)[name = tensor("op_4892_cast_fp16")]; + tensor var_4894_to_fp16 = const()[name = tensor("op_4894_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586643648)))]; + tensor hidden_states_127_cast_fp16 = mul(x = var_4892_cast_fp16, y = var_4894_to_fp16)[name = tensor("hidden_states_127_cast_fp16")]; + tensor var_4901 = const()[name = tensor("op_4901"), val = tensor([1, 1])]; + tensor var_4903 = const()[name = tensor("op_4903"), val = tensor([1, 1])]; + tensor q_27_pad_type_0 = const()[name = tensor("q_27_pad_type_0"), val = tensor("custom")]; + tensor q_27_pad_0 = const()[name = tensor("q_27_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586646272)))]; + tensor q_27_cast_fp16 = conv(dilations = var_4903, groups = var_4371, pad = q_27_pad_0, pad_type = q_27_pad_type_0, strides = var_4901, weight = mid_block_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_127_cast_fp16)[name = tensor("q_27_cast_fp16")]; + tensor var_4907 = const()[name = tensor("op_4907"), val = tensor([1, 1])]; + tensor var_4909 = const()[name = tensor("op_4909"), val = tensor([1, 1])]; + tensor k_53_pad_type_0 = const()[name = tensor("k_53_pad_type_0"), val = tensor("custom")]; + tensor k_53_pad_0 = const()[name = tensor("k_53_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589923136)))]; + tensor k_53_cast_fp16 = conv(dilations = var_4909, groups = var_4371, pad = k_53_pad_0, pad_type = k_53_pad_type_0, strides = var_4907, weight = mid_block_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_53_cast_fp16")]; + tensor var_4913 = const()[name = tensor("op_4913"), val = tensor([1, 1])]; + tensor var_4915 = const()[name = tensor("op_4915"), val = tensor([1, 1])]; + tensor v_27_pad_type_0 = const()[name = tensor("v_27_pad_type_0"), val = tensor("custom")]; + tensor v_27_pad_0 = const()[name = tensor("v_27_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(592544640)))]; + tensor v_27_cast_fp16 = conv(dilations = var_4915, groups = var_4371, pad = v_27_pad_0, pad_type = v_27_pad_type_0, strides = var_4913, weight = mid_block_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_27_cast_fp16")]; + tensor var_4919_begin_0 = const()[name = tensor("op_4919_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_4919_end_0 = const()[name = tensor("op_4919_end_0"), val = tensor([2, 64, 1, 36])]; + tensor var_4919_end_mask_0 = const()[name = tensor("op_4919_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4919_cast_fp16 = slice_by_index(begin = var_4919_begin_0, end = var_4919_end_0, end_mask = var_4919_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4919_cast_fp16")]; + tensor var_4923_begin_0 = const()[name = tensor("op_4923_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_4923_end_0 = const()[name = tensor("op_4923_end_0"), val = tensor([2, 128, 1, 36])]; + tensor var_4923_end_mask_0 = const()[name = tensor("op_4923_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4923_cast_fp16 = slice_by_index(begin = var_4923_begin_0, end = var_4923_end_0, end_mask = var_4923_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4923_cast_fp16")]; + tensor var_4927_begin_0 = const()[name = tensor("op_4927_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_4927_end_0 = const()[name = tensor("op_4927_end_0"), val = tensor([2, 192, 1, 36])]; + tensor var_4927_end_mask_0 = const()[name = tensor("op_4927_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4927_cast_fp16 = slice_by_index(begin = var_4927_begin_0, end = var_4927_end_0, end_mask = var_4927_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4927_cast_fp16")]; + tensor var_4931_begin_0 = const()[name = tensor("op_4931_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_4931_end_0 = const()[name = tensor("op_4931_end_0"), val = tensor([2, 256, 1, 36])]; + tensor var_4931_end_mask_0 = const()[name = tensor("op_4931_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4931_cast_fp16 = slice_by_index(begin = var_4931_begin_0, end = var_4931_end_0, end_mask = var_4931_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4931_cast_fp16")]; + tensor var_4935_begin_0 = const()[name = tensor("op_4935_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_4935_end_0 = const()[name = tensor("op_4935_end_0"), val = tensor([2, 320, 1, 36])]; + tensor var_4935_end_mask_0 = const()[name = tensor("op_4935_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4935_cast_fp16 = slice_by_index(begin = var_4935_begin_0, end = var_4935_end_0, end_mask = var_4935_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4935_cast_fp16")]; + tensor var_4939_begin_0 = const()[name = tensor("op_4939_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_4939_end_0 = const()[name = tensor("op_4939_end_0"), val = tensor([2, 384, 1, 36])]; + tensor var_4939_end_mask_0 = const()[name = tensor("op_4939_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4939_cast_fp16 = slice_by_index(begin = var_4939_begin_0, end = var_4939_end_0, end_mask = var_4939_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4939_cast_fp16")]; + tensor var_4943_begin_0 = const()[name = tensor("op_4943_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_4943_end_0 = const()[name = tensor("op_4943_end_0"), val = tensor([2, 448, 1, 36])]; + tensor var_4943_end_mask_0 = const()[name = tensor("op_4943_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4943_cast_fp16 = slice_by_index(begin = var_4943_begin_0, end = var_4943_end_0, end_mask = var_4943_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4943_cast_fp16")]; + tensor var_4947_begin_0 = const()[name = tensor("op_4947_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_4947_end_0 = const()[name = tensor("op_4947_end_0"), val = tensor([2, 512, 1, 36])]; + tensor var_4947_end_mask_0 = const()[name = tensor("op_4947_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4947_cast_fp16 = slice_by_index(begin = var_4947_begin_0, end = var_4947_end_0, end_mask = var_4947_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4947_cast_fp16")]; + tensor var_4951_begin_0 = const()[name = tensor("op_4951_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_4951_end_0 = const()[name = tensor("op_4951_end_0"), val = tensor([2, 576, 1, 36])]; + tensor var_4951_end_mask_0 = const()[name = tensor("op_4951_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4951_cast_fp16 = slice_by_index(begin = var_4951_begin_0, end = var_4951_end_0, end_mask = var_4951_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4951_cast_fp16")]; + tensor var_4955_begin_0 = const()[name = tensor("op_4955_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_4955_end_0 = const()[name = tensor("op_4955_end_0"), val = tensor([2, 640, 1, 36])]; + tensor var_4955_end_mask_0 = const()[name = tensor("op_4955_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4955_cast_fp16 = slice_by_index(begin = var_4955_begin_0, end = var_4955_end_0, end_mask = var_4955_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4955_cast_fp16")]; + tensor var_4959_begin_0 = const()[name = tensor("op_4959_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_4959_end_0 = const()[name = tensor("op_4959_end_0"), val = tensor([2, 704, 1, 36])]; + tensor var_4959_end_mask_0 = const()[name = tensor("op_4959_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4959_cast_fp16 = slice_by_index(begin = var_4959_begin_0, end = var_4959_end_0, end_mask = var_4959_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4959_cast_fp16")]; + tensor var_4963_begin_0 = const()[name = tensor("op_4963_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_4963_end_0 = const()[name = tensor("op_4963_end_0"), val = tensor([2, 768, 1, 36])]; + tensor var_4963_end_mask_0 = const()[name = tensor("op_4963_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4963_cast_fp16 = slice_by_index(begin = var_4963_begin_0, end = var_4963_end_0, end_mask = var_4963_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4963_cast_fp16")]; + tensor var_4967_begin_0 = const()[name = tensor("op_4967_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_4967_end_0 = const()[name = tensor("op_4967_end_0"), val = tensor([2, 832, 1, 36])]; + tensor var_4967_end_mask_0 = const()[name = tensor("op_4967_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4967_cast_fp16 = slice_by_index(begin = var_4967_begin_0, end = var_4967_end_0, end_mask = var_4967_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4967_cast_fp16")]; + tensor var_4971_begin_0 = const()[name = tensor("op_4971_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_4971_end_0 = const()[name = tensor("op_4971_end_0"), val = tensor([2, 896, 1, 36])]; + tensor var_4971_end_mask_0 = const()[name = tensor("op_4971_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4971_cast_fp16 = slice_by_index(begin = var_4971_begin_0, end = var_4971_end_0, end_mask = var_4971_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4971_cast_fp16")]; + tensor var_4975_begin_0 = const()[name = tensor("op_4975_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_4975_end_0 = const()[name = tensor("op_4975_end_0"), val = tensor([2, 960, 1, 36])]; + tensor var_4975_end_mask_0 = const()[name = tensor("op_4975_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4975_cast_fp16 = slice_by_index(begin = var_4975_begin_0, end = var_4975_end_0, end_mask = var_4975_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4975_cast_fp16")]; + tensor var_4979_begin_0 = const()[name = tensor("op_4979_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_4979_end_0 = const()[name = tensor("op_4979_end_0"), val = tensor([2, 1024, 1, 36])]; + tensor var_4979_end_mask_0 = const()[name = tensor("op_4979_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4979_cast_fp16 = slice_by_index(begin = var_4979_begin_0, end = var_4979_end_0, end_mask = var_4979_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4979_cast_fp16")]; + tensor var_4983_begin_0 = const()[name = tensor("op_4983_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_4983_end_0 = const()[name = tensor("op_4983_end_0"), val = tensor([2, 1088, 1, 36])]; + tensor var_4983_end_mask_0 = const()[name = tensor("op_4983_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4983_cast_fp16 = slice_by_index(begin = var_4983_begin_0, end = var_4983_end_0, end_mask = var_4983_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4983_cast_fp16")]; + tensor var_4987_begin_0 = const()[name = tensor("op_4987_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_4987_end_0 = const()[name = tensor("op_4987_end_0"), val = tensor([2, 1152, 1, 36])]; + tensor var_4987_end_mask_0 = const()[name = tensor("op_4987_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4987_cast_fp16 = slice_by_index(begin = var_4987_begin_0, end = var_4987_end_0, end_mask = var_4987_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4987_cast_fp16")]; + tensor var_4991_begin_0 = const()[name = tensor("op_4991_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_4991_end_0 = const()[name = tensor("op_4991_end_0"), val = tensor([2, 1216, 1, 36])]; + tensor var_4991_end_mask_0 = const()[name = tensor("op_4991_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4991_cast_fp16 = slice_by_index(begin = var_4991_begin_0, end = var_4991_end_0, end_mask = var_4991_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4991_cast_fp16")]; + tensor var_4995_begin_0 = const()[name = tensor("op_4995_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_4995_end_0 = const()[name = tensor("op_4995_end_0"), val = tensor([2, 1280, 1, 36])]; + tensor var_4995_end_mask_0 = const()[name = tensor("op_4995_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_4995_cast_fp16 = slice_by_index(begin = var_4995_begin_0, end = var_4995_end_0, end_mask = var_4995_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4995_cast_fp16")]; + tensor k_55_perm_0 = const()[name = tensor("k_55_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_5002_begin_0 = const()[name = tensor("op_5002_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_5002_end_0 = const()[name = tensor("op_5002_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_5002_end_mask_0 = const()[name = tensor("op_5002_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_18 = transpose(perm = k_55_perm_0, x = k_53_cast_fp16)[name = tensor("transpose_18")]; + tensor var_5002_cast_fp16 = slice_by_index(begin = var_5002_begin_0, end = var_5002_end_0, end_mask = var_5002_end_mask_0, x = transpose_18)[name = tensor("op_5002_cast_fp16")]; + tensor var_5006_begin_0 = const()[name = tensor("op_5006_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_5006_end_0 = const()[name = tensor("op_5006_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_5006_end_mask_0 = const()[name = tensor("op_5006_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5006_cast_fp16 = slice_by_index(begin = var_5006_begin_0, end = var_5006_end_0, end_mask = var_5006_end_mask_0, x = transpose_18)[name = tensor("op_5006_cast_fp16")]; + tensor var_5010_begin_0 = const()[name = tensor("op_5010_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_5010_end_0 = const()[name = tensor("op_5010_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_5010_end_mask_0 = const()[name = tensor("op_5010_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5010_cast_fp16 = slice_by_index(begin = var_5010_begin_0, end = var_5010_end_0, end_mask = var_5010_end_mask_0, x = transpose_18)[name = tensor("op_5010_cast_fp16")]; + tensor var_5014_begin_0 = const()[name = tensor("op_5014_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_5014_end_0 = const()[name = tensor("op_5014_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_5014_end_mask_0 = const()[name = tensor("op_5014_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5014_cast_fp16 = slice_by_index(begin = var_5014_begin_0, end = var_5014_end_0, end_mask = var_5014_end_mask_0, x = transpose_18)[name = tensor("op_5014_cast_fp16")]; + tensor var_5018_begin_0 = const()[name = tensor("op_5018_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_5018_end_0 = const()[name = tensor("op_5018_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_5018_end_mask_0 = const()[name = tensor("op_5018_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5018_cast_fp16 = slice_by_index(begin = var_5018_begin_0, end = var_5018_end_0, end_mask = var_5018_end_mask_0, x = transpose_18)[name = tensor("op_5018_cast_fp16")]; + tensor var_5022_begin_0 = const()[name = tensor("op_5022_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_5022_end_0 = const()[name = tensor("op_5022_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_5022_end_mask_0 = const()[name = tensor("op_5022_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5022_cast_fp16 = slice_by_index(begin = var_5022_begin_0, end = var_5022_end_0, end_mask = var_5022_end_mask_0, x = transpose_18)[name = tensor("op_5022_cast_fp16")]; + tensor var_5026_begin_0 = const()[name = tensor("op_5026_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_5026_end_0 = const()[name = tensor("op_5026_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_5026_end_mask_0 = const()[name = tensor("op_5026_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5026_cast_fp16 = slice_by_index(begin = var_5026_begin_0, end = var_5026_end_0, end_mask = var_5026_end_mask_0, x = transpose_18)[name = tensor("op_5026_cast_fp16")]; + tensor var_5030_begin_0 = const()[name = tensor("op_5030_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_5030_end_0 = const()[name = tensor("op_5030_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_5030_end_mask_0 = const()[name = tensor("op_5030_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5030_cast_fp16 = slice_by_index(begin = var_5030_begin_0, end = var_5030_end_0, end_mask = var_5030_end_mask_0, x = transpose_18)[name = tensor("op_5030_cast_fp16")]; + tensor var_5034_begin_0 = const()[name = tensor("op_5034_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_5034_end_0 = const()[name = tensor("op_5034_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_5034_end_mask_0 = const()[name = tensor("op_5034_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5034_cast_fp16 = slice_by_index(begin = var_5034_begin_0, end = var_5034_end_0, end_mask = var_5034_end_mask_0, x = transpose_18)[name = tensor("op_5034_cast_fp16")]; + tensor var_5038_begin_0 = const()[name = tensor("op_5038_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_5038_end_0 = const()[name = tensor("op_5038_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_5038_end_mask_0 = const()[name = tensor("op_5038_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5038_cast_fp16 = slice_by_index(begin = var_5038_begin_0, end = var_5038_end_0, end_mask = var_5038_end_mask_0, x = transpose_18)[name = tensor("op_5038_cast_fp16")]; + tensor var_5042_begin_0 = const()[name = tensor("op_5042_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_5042_end_0 = const()[name = tensor("op_5042_end_0"), val = tensor([2, 77, 1, 704])]; + tensor var_5042_end_mask_0 = const()[name = tensor("op_5042_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5042_cast_fp16 = slice_by_index(begin = var_5042_begin_0, end = var_5042_end_0, end_mask = var_5042_end_mask_0, x = transpose_18)[name = tensor("op_5042_cast_fp16")]; + tensor var_5046_begin_0 = const()[name = tensor("op_5046_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_5046_end_0 = const()[name = tensor("op_5046_end_0"), val = tensor([2, 77, 1, 768])]; + tensor var_5046_end_mask_0 = const()[name = tensor("op_5046_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5046_cast_fp16 = slice_by_index(begin = var_5046_begin_0, end = var_5046_end_0, end_mask = var_5046_end_mask_0, x = transpose_18)[name = tensor("op_5046_cast_fp16")]; + tensor var_5050_begin_0 = const()[name = tensor("op_5050_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_5050_end_0 = const()[name = tensor("op_5050_end_0"), val = tensor([2, 77, 1, 832])]; + tensor var_5050_end_mask_0 = const()[name = tensor("op_5050_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5050_cast_fp16 = slice_by_index(begin = var_5050_begin_0, end = var_5050_end_0, end_mask = var_5050_end_mask_0, x = transpose_18)[name = tensor("op_5050_cast_fp16")]; + tensor var_5054_begin_0 = const()[name = tensor("op_5054_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_5054_end_0 = const()[name = tensor("op_5054_end_0"), val = tensor([2, 77, 1, 896])]; + tensor var_5054_end_mask_0 = const()[name = tensor("op_5054_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5054_cast_fp16 = slice_by_index(begin = var_5054_begin_0, end = var_5054_end_0, end_mask = var_5054_end_mask_0, x = transpose_18)[name = tensor("op_5054_cast_fp16")]; + tensor var_5058_begin_0 = const()[name = tensor("op_5058_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_5058_end_0 = const()[name = tensor("op_5058_end_0"), val = tensor([2, 77, 1, 960])]; + tensor var_5058_end_mask_0 = const()[name = tensor("op_5058_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5058_cast_fp16 = slice_by_index(begin = var_5058_begin_0, end = var_5058_end_0, end_mask = var_5058_end_mask_0, x = transpose_18)[name = tensor("op_5058_cast_fp16")]; + tensor var_5062_begin_0 = const()[name = tensor("op_5062_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_5062_end_0 = const()[name = tensor("op_5062_end_0"), val = tensor([2, 77, 1, 1024])]; + tensor var_5062_end_mask_0 = const()[name = tensor("op_5062_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5062_cast_fp16 = slice_by_index(begin = var_5062_begin_0, end = var_5062_end_0, end_mask = var_5062_end_mask_0, x = transpose_18)[name = tensor("op_5062_cast_fp16")]; + tensor var_5066_begin_0 = const()[name = tensor("op_5066_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_5066_end_0 = const()[name = tensor("op_5066_end_0"), val = tensor([2, 77, 1, 1088])]; + tensor var_5066_end_mask_0 = const()[name = tensor("op_5066_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5066_cast_fp16 = slice_by_index(begin = var_5066_begin_0, end = var_5066_end_0, end_mask = var_5066_end_mask_0, x = transpose_18)[name = tensor("op_5066_cast_fp16")]; + tensor var_5070_begin_0 = const()[name = tensor("op_5070_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_5070_end_0 = const()[name = tensor("op_5070_end_0"), val = tensor([2, 77, 1, 1152])]; + tensor var_5070_end_mask_0 = const()[name = tensor("op_5070_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5070_cast_fp16 = slice_by_index(begin = var_5070_begin_0, end = var_5070_end_0, end_mask = var_5070_end_mask_0, x = transpose_18)[name = tensor("op_5070_cast_fp16")]; + tensor var_5074_begin_0 = const()[name = tensor("op_5074_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_5074_end_0 = const()[name = tensor("op_5074_end_0"), val = tensor([2, 77, 1, 1216])]; + tensor var_5074_end_mask_0 = const()[name = tensor("op_5074_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5074_cast_fp16 = slice_by_index(begin = var_5074_begin_0, end = var_5074_end_0, end_mask = var_5074_end_mask_0, x = transpose_18)[name = tensor("op_5074_cast_fp16")]; + tensor var_5078_begin_0 = const()[name = tensor("op_5078_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_5078_end_0 = const()[name = tensor("op_5078_end_0"), val = tensor([2, 77, 1, 1280])]; + tensor var_5078_end_mask_0 = const()[name = tensor("op_5078_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5078_cast_fp16 = slice_by_index(begin = var_5078_begin_0, end = var_5078_end_0, end_mask = var_5078_end_mask_0, x = transpose_18)[name = tensor("op_5078_cast_fp16")]; + tensor var_5080_begin_0 = const()[name = tensor("op_5080_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_5080_end_0 = const()[name = tensor("op_5080_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_5080_end_mask_0 = const()[name = tensor("op_5080_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5080_cast_fp16 = slice_by_index(begin = var_5080_begin_0, end = var_5080_end_0, end_mask = var_5080_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5080_cast_fp16")]; + tensor var_5084_begin_0 = const()[name = tensor("op_5084_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_5084_end_0 = const()[name = tensor("op_5084_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_5084_end_mask_0 = const()[name = tensor("op_5084_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5084_cast_fp16 = slice_by_index(begin = var_5084_begin_0, end = var_5084_end_0, end_mask = var_5084_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5084_cast_fp16")]; + tensor var_5088_begin_0 = const()[name = tensor("op_5088_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_5088_end_0 = const()[name = tensor("op_5088_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_5088_end_mask_0 = const()[name = tensor("op_5088_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5088_cast_fp16 = slice_by_index(begin = var_5088_begin_0, end = var_5088_end_0, end_mask = var_5088_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5088_cast_fp16")]; + tensor var_5092_begin_0 = const()[name = tensor("op_5092_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_5092_end_0 = const()[name = tensor("op_5092_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_5092_end_mask_0 = const()[name = tensor("op_5092_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5092_cast_fp16 = slice_by_index(begin = var_5092_begin_0, end = var_5092_end_0, end_mask = var_5092_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5092_cast_fp16")]; + tensor var_5096_begin_0 = const()[name = tensor("op_5096_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_5096_end_0 = const()[name = tensor("op_5096_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_5096_end_mask_0 = const()[name = tensor("op_5096_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5096_cast_fp16 = slice_by_index(begin = var_5096_begin_0, end = var_5096_end_0, end_mask = var_5096_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5096_cast_fp16")]; + tensor var_5100_begin_0 = const()[name = tensor("op_5100_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_5100_end_0 = const()[name = tensor("op_5100_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_5100_end_mask_0 = const()[name = tensor("op_5100_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5100_cast_fp16 = slice_by_index(begin = var_5100_begin_0, end = var_5100_end_0, end_mask = var_5100_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5100_cast_fp16")]; + tensor var_5104_begin_0 = const()[name = tensor("op_5104_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_5104_end_0 = const()[name = tensor("op_5104_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_5104_end_mask_0 = const()[name = tensor("op_5104_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5104_cast_fp16 = slice_by_index(begin = var_5104_begin_0, end = var_5104_end_0, end_mask = var_5104_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5104_cast_fp16")]; + tensor var_5108_begin_0 = const()[name = tensor("op_5108_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_5108_end_0 = const()[name = tensor("op_5108_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_5108_end_mask_0 = const()[name = tensor("op_5108_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5108_cast_fp16 = slice_by_index(begin = var_5108_begin_0, end = var_5108_end_0, end_mask = var_5108_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5108_cast_fp16")]; + tensor var_5112_begin_0 = const()[name = tensor("op_5112_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_5112_end_0 = const()[name = tensor("op_5112_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_5112_end_mask_0 = const()[name = tensor("op_5112_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5112_cast_fp16 = slice_by_index(begin = var_5112_begin_0, end = var_5112_end_0, end_mask = var_5112_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5112_cast_fp16")]; + tensor var_5116_begin_0 = const()[name = tensor("op_5116_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_5116_end_0 = const()[name = tensor("op_5116_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_5116_end_mask_0 = const()[name = tensor("op_5116_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5116_cast_fp16 = slice_by_index(begin = var_5116_begin_0, end = var_5116_end_0, end_mask = var_5116_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5116_cast_fp16")]; + tensor var_5120_begin_0 = const()[name = tensor("op_5120_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_5120_end_0 = const()[name = tensor("op_5120_end_0"), val = tensor([2, 704, 1, 77])]; + tensor var_5120_end_mask_0 = const()[name = tensor("op_5120_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5120_cast_fp16 = slice_by_index(begin = var_5120_begin_0, end = var_5120_end_0, end_mask = var_5120_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5120_cast_fp16")]; + tensor var_5124_begin_0 = const()[name = tensor("op_5124_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_5124_end_0 = const()[name = tensor("op_5124_end_0"), val = tensor([2, 768, 1, 77])]; + tensor var_5124_end_mask_0 = const()[name = tensor("op_5124_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5124_cast_fp16 = slice_by_index(begin = var_5124_begin_0, end = var_5124_end_0, end_mask = var_5124_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5124_cast_fp16")]; + tensor var_5128_begin_0 = const()[name = tensor("op_5128_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_5128_end_0 = const()[name = tensor("op_5128_end_0"), val = tensor([2, 832, 1, 77])]; + tensor var_5128_end_mask_0 = const()[name = tensor("op_5128_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5128_cast_fp16 = slice_by_index(begin = var_5128_begin_0, end = var_5128_end_0, end_mask = var_5128_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5128_cast_fp16")]; + tensor var_5132_begin_0 = const()[name = tensor("op_5132_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_5132_end_0 = const()[name = tensor("op_5132_end_0"), val = tensor([2, 896, 1, 77])]; + tensor var_5132_end_mask_0 = const()[name = tensor("op_5132_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5132_cast_fp16 = slice_by_index(begin = var_5132_begin_0, end = var_5132_end_0, end_mask = var_5132_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5132_cast_fp16")]; + tensor var_5136_begin_0 = const()[name = tensor("op_5136_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_5136_end_0 = const()[name = tensor("op_5136_end_0"), val = tensor([2, 960, 1, 77])]; + tensor var_5136_end_mask_0 = const()[name = tensor("op_5136_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5136_cast_fp16 = slice_by_index(begin = var_5136_begin_0, end = var_5136_end_0, end_mask = var_5136_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5136_cast_fp16")]; + tensor var_5140_begin_0 = const()[name = tensor("op_5140_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_5140_end_0 = const()[name = tensor("op_5140_end_0"), val = tensor([2, 1024, 1, 77])]; + tensor var_5140_end_mask_0 = const()[name = tensor("op_5140_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5140_cast_fp16 = slice_by_index(begin = var_5140_begin_0, end = var_5140_end_0, end_mask = var_5140_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5140_cast_fp16")]; + tensor var_5144_begin_0 = const()[name = tensor("op_5144_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_5144_end_0 = const()[name = tensor("op_5144_end_0"), val = tensor([2, 1088, 1, 77])]; + tensor var_5144_end_mask_0 = const()[name = tensor("op_5144_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5144_cast_fp16 = slice_by_index(begin = var_5144_begin_0, end = var_5144_end_0, end_mask = var_5144_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5144_cast_fp16")]; + tensor var_5148_begin_0 = const()[name = tensor("op_5148_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_5148_end_0 = const()[name = tensor("op_5148_end_0"), val = tensor([2, 1152, 1, 77])]; + tensor var_5148_end_mask_0 = const()[name = tensor("op_5148_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5148_cast_fp16 = slice_by_index(begin = var_5148_begin_0, end = var_5148_end_0, end_mask = var_5148_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5148_cast_fp16")]; + tensor var_5152_begin_0 = const()[name = tensor("op_5152_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_5152_end_0 = const()[name = tensor("op_5152_end_0"), val = tensor([2, 1216, 1, 77])]; + tensor var_5152_end_mask_0 = const()[name = tensor("op_5152_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5152_cast_fp16 = slice_by_index(begin = var_5152_begin_0, end = var_5152_end_0, end_mask = var_5152_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5152_cast_fp16")]; + tensor var_5156_begin_0 = const()[name = tensor("op_5156_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_5156_end_0 = const()[name = tensor("op_5156_end_0"), val = tensor([2, 1280, 1, 77])]; + tensor var_5156_end_mask_0 = const()[name = tensor("op_5156_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5156_cast_fp16 = slice_by_index(begin = var_5156_begin_0, end = var_5156_end_0, end_mask = var_5156_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5156_cast_fp16")]; + tensor var_5160_equation_0 = const()[name = tensor("op_5160_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5160_cast_fp16 = einsum(equation = var_5160_equation_0, values = (var_5002_cast_fp16, var_4919_cast_fp16))[name = tensor("op_5160_cast_fp16")]; + tensor var_5161_to_fp16 = const()[name = tensor("op_5161_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_321_cast_fp16 = mul(x = var_5160_cast_fp16, y = var_5161_to_fp16)[name = tensor("aw_321_cast_fp16")]; + tensor var_5164_equation_0 = const()[name = tensor("op_5164_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5164_cast_fp16 = einsum(equation = var_5164_equation_0, values = (var_5006_cast_fp16, var_4923_cast_fp16))[name = tensor("op_5164_cast_fp16")]; + tensor var_5165_to_fp16 = const()[name = tensor("op_5165_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_323_cast_fp16 = mul(x = var_5164_cast_fp16, y = var_5165_to_fp16)[name = tensor("aw_323_cast_fp16")]; + tensor var_5168_equation_0 = const()[name = tensor("op_5168_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5168_cast_fp16 = einsum(equation = var_5168_equation_0, values = (var_5010_cast_fp16, var_4927_cast_fp16))[name = tensor("op_5168_cast_fp16")]; + tensor var_5169_to_fp16 = const()[name = tensor("op_5169_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_325_cast_fp16 = mul(x = var_5168_cast_fp16, y = var_5169_to_fp16)[name = tensor("aw_325_cast_fp16")]; + tensor var_5172_equation_0 = const()[name = tensor("op_5172_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5172_cast_fp16 = einsum(equation = var_5172_equation_0, values = (var_5014_cast_fp16, var_4931_cast_fp16))[name = tensor("op_5172_cast_fp16")]; + tensor var_5173_to_fp16 = const()[name = tensor("op_5173_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_327_cast_fp16 = mul(x = var_5172_cast_fp16, y = var_5173_to_fp16)[name = tensor("aw_327_cast_fp16")]; + tensor var_5176_equation_0 = const()[name = tensor("op_5176_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5176_cast_fp16 = einsum(equation = var_5176_equation_0, values = (var_5018_cast_fp16, var_4935_cast_fp16))[name = tensor("op_5176_cast_fp16")]; + tensor var_5177_to_fp16 = const()[name = tensor("op_5177_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_329_cast_fp16 = mul(x = var_5176_cast_fp16, y = var_5177_to_fp16)[name = tensor("aw_329_cast_fp16")]; + tensor var_5180_equation_0 = const()[name = tensor("op_5180_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5180_cast_fp16 = einsum(equation = var_5180_equation_0, values = (var_5022_cast_fp16, var_4939_cast_fp16))[name = tensor("op_5180_cast_fp16")]; + tensor var_5181_to_fp16 = const()[name = tensor("op_5181_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_331_cast_fp16 = mul(x = var_5180_cast_fp16, y = var_5181_to_fp16)[name = tensor("aw_331_cast_fp16")]; + tensor var_5184_equation_0 = const()[name = tensor("op_5184_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5184_cast_fp16 = einsum(equation = var_5184_equation_0, values = (var_5026_cast_fp16, var_4943_cast_fp16))[name = tensor("op_5184_cast_fp16")]; + tensor var_5185_to_fp16 = const()[name = tensor("op_5185_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_333_cast_fp16 = mul(x = var_5184_cast_fp16, y = var_5185_to_fp16)[name = tensor("aw_333_cast_fp16")]; + tensor var_5188_equation_0 = const()[name = tensor("op_5188_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5188_cast_fp16 = einsum(equation = var_5188_equation_0, values = (var_5030_cast_fp16, var_4947_cast_fp16))[name = tensor("op_5188_cast_fp16")]; + tensor var_5189_to_fp16 = const()[name = tensor("op_5189_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_335_cast_fp16 = mul(x = var_5188_cast_fp16, y = var_5189_to_fp16)[name = tensor("aw_335_cast_fp16")]; + tensor var_5192_equation_0 = const()[name = tensor("op_5192_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5192_cast_fp16 = einsum(equation = var_5192_equation_0, values = (var_5034_cast_fp16, var_4951_cast_fp16))[name = tensor("op_5192_cast_fp16")]; + tensor var_5193_to_fp16 = const()[name = tensor("op_5193_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_337_cast_fp16 = mul(x = var_5192_cast_fp16, y = var_5193_to_fp16)[name = tensor("aw_337_cast_fp16")]; + tensor var_5196_equation_0 = const()[name = tensor("op_5196_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5196_cast_fp16 = einsum(equation = var_5196_equation_0, values = (var_5038_cast_fp16, var_4955_cast_fp16))[name = tensor("op_5196_cast_fp16")]; + tensor var_5197_to_fp16 = const()[name = tensor("op_5197_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_339_cast_fp16 = mul(x = var_5196_cast_fp16, y = var_5197_to_fp16)[name = tensor("aw_339_cast_fp16")]; + tensor var_5200_equation_0 = const()[name = tensor("op_5200_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5200_cast_fp16 = einsum(equation = var_5200_equation_0, values = (var_5042_cast_fp16, var_4959_cast_fp16))[name = tensor("op_5200_cast_fp16")]; + tensor var_5201_to_fp16 = const()[name = tensor("op_5201_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_341_cast_fp16 = mul(x = var_5200_cast_fp16, y = var_5201_to_fp16)[name = tensor("aw_341_cast_fp16")]; + tensor var_5204_equation_0 = const()[name = tensor("op_5204_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5204_cast_fp16 = einsum(equation = var_5204_equation_0, values = (var_5046_cast_fp16, var_4963_cast_fp16))[name = tensor("op_5204_cast_fp16")]; + tensor var_5205_to_fp16 = const()[name = tensor("op_5205_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_343_cast_fp16 = mul(x = var_5204_cast_fp16, y = var_5205_to_fp16)[name = tensor("aw_343_cast_fp16")]; + tensor var_5208_equation_0 = const()[name = tensor("op_5208_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5208_cast_fp16 = einsum(equation = var_5208_equation_0, values = (var_5050_cast_fp16, var_4967_cast_fp16))[name = tensor("op_5208_cast_fp16")]; + tensor var_5209_to_fp16 = const()[name = tensor("op_5209_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_345_cast_fp16 = mul(x = var_5208_cast_fp16, y = var_5209_to_fp16)[name = tensor("aw_345_cast_fp16")]; + tensor var_5212_equation_0 = const()[name = tensor("op_5212_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5212_cast_fp16 = einsum(equation = var_5212_equation_0, values = (var_5054_cast_fp16, var_4971_cast_fp16))[name = tensor("op_5212_cast_fp16")]; + tensor var_5213_to_fp16 = const()[name = tensor("op_5213_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_347_cast_fp16 = mul(x = var_5212_cast_fp16, y = var_5213_to_fp16)[name = tensor("aw_347_cast_fp16")]; + tensor var_5216_equation_0 = const()[name = tensor("op_5216_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5216_cast_fp16 = einsum(equation = var_5216_equation_0, values = (var_5058_cast_fp16, var_4975_cast_fp16))[name = tensor("op_5216_cast_fp16")]; + tensor var_5217_to_fp16 = const()[name = tensor("op_5217_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_349_cast_fp16 = mul(x = var_5216_cast_fp16, y = var_5217_to_fp16)[name = tensor("aw_349_cast_fp16")]; + tensor var_5220_equation_0 = const()[name = tensor("op_5220_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5220_cast_fp16 = einsum(equation = var_5220_equation_0, values = (var_5062_cast_fp16, var_4979_cast_fp16))[name = tensor("op_5220_cast_fp16")]; + tensor var_5221_to_fp16 = const()[name = tensor("op_5221_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_351_cast_fp16 = mul(x = var_5220_cast_fp16, y = var_5221_to_fp16)[name = tensor("aw_351_cast_fp16")]; + tensor var_5224_equation_0 = const()[name = tensor("op_5224_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5224_cast_fp16 = einsum(equation = var_5224_equation_0, values = (var_5066_cast_fp16, var_4983_cast_fp16))[name = tensor("op_5224_cast_fp16")]; + tensor var_5225_to_fp16 = const()[name = tensor("op_5225_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_353_cast_fp16 = mul(x = var_5224_cast_fp16, y = var_5225_to_fp16)[name = tensor("aw_353_cast_fp16")]; + tensor var_5228_equation_0 = const()[name = tensor("op_5228_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5228_cast_fp16 = einsum(equation = var_5228_equation_0, values = (var_5070_cast_fp16, var_4987_cast_fp16))[name = tensor("op_5228_cast_fp16")]; + tensor var_5229_to_fp16 = const()[name = tensor("op_5229_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_355_cast_fp16 = mul(x = var_5228_cast_fp16, y = var_5229_to_fp16)[name = tensor("aw_355_cast_fp16")]; + tensor var_5232_equation_0 = const()[name = tensor("op_5232_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5232_cast_fp16 = einsum(equation = var_5232_equation_0, values = (var_5074_cast_fp16, var_4991_cast_fp16))[name = tensor("op_5232_cast_fp16")]; + tensor var_5233_to_fp16 = const()[name = tensor("op_5233_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_357_cast_fp16 = mul(x = var_5232_cast_fp16, y = var_5233_to_fp16)[name = tensor("aw_357_cast_fp16")]; + tensor var_5236_equation_0 = const()[name = tensor("op_5236_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5236_cast_fp16 = einsum(equation = var_5236_equation_0, values = (var_5078_cast_fp16, var_4995_cast_fp16))[name = tensor("op_5236_cast_fp16")]; + tensor var_5237_to_fp16 = const()[name = tensor("op_5237_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_359_cast_fp16 = mul(x = var_5236_cast_fp16, y = var_5237_to_fp16)[name = tensor("aw_359_cast_fp16")]; + tensor var_5239_cast_fp16 = softmax(axis = var_4371, x = aw_321_cast_fp16)[name = tensor("op_5239_cast_fp16")]; + tensor var_5240_cast_fp16 = softmax(axis = var_4371, x = aw_323_cast_fp16)[name = tensor("op_5240_cast_fp16")]; + tensor var_5241_cast_fp16 = softmax(axis = var_4371, x = aw_325_cast_fp16)[name = tensor("op_5241_cast_fp16")]; + tensor var_5242_cast_fp16 = softmax(axis = var_4371, x = aw_327_cast_fp16)[name = tensor("op_5242_cast_fp16")]; + tensor var_5243_cast_fp16 = softmax(axis = var_4371, x = aw_329_cast_fp16)[name = tensor("op_5243_cast_fp16")]; + tensor var_5244_cast_fp16 = softmax(axis = var_4371, x = aw_331_cast_fp16)[name = tensor("op_5244_cast_fp16")]; + tensor var_5245_cast_fp16 = softmax(axis = var_4371, x = aw_333_cast_fp16)[name = tensor("op_5245_cast_fp16")]; + tensor var_5246_cast_fp16 = softmax(axis = var_4371, x = aw_335_cast_fp16)[name = tensor("op_5246_cast_fp16")]; + tensor var_5247_cast_fp16 = softmax(axis = var_4371, x = aw_337_cast_fp16)[name = tensor("op_5247_cast_fp16")]; + tensor var_5248_cast_fp16 = softmax(axis = var_4371, x = aw_339_cast_fp16)[name = tensor("op_5248_cast_fp16")]; + tensor var_5249_cast_fp16 = softmax(axis = var_4371, x = aw_341_cast_fp16)[name = tensor("op_5249_cast_fp16")]; + tensor var_5250_cast_fp16 = softmax(axis = var_4371, x = aw_343_cast_fp16)[name = tensor("op_5250_cast_fp16")]; + tensor var_5251_cast_fp16 = softmax(axis = var_4371, x = aw_345_cast_fp16)[name = tensor("op_5251_cast_fp16")]; + tensor var_5252_cast_fp16 = softmax(axis = var_4371, x = aw_347_cast_fp16)[name = tensor("op_5252_cast_fp16")]; + tensor var_5253_cast_fp16 = softmax(axis = var_4371, x = aw_349_cast_fp16)[name = tensor("op_5253_cast_fp16")]; + tensor var_5254_cast_fp16 = softmax(axis = var_4371, x = aw_351_cast_fp16)[name = tensor("op_5254_cast_fp16")]; + tensor var_5255_cast_fp16 = softmax(axis = var_4371, x = aw_353_cast_fp16)[name = tensor("op_5255_cast_fp16")]; + tensor var_5256_cast_fp16 = softmax(axis = var_4371, x = aw_355_cast_fp16)[name = tensor("op_5256_cast_fp16")]; + tensor var_5257_cast_fp16 = softmax(axis = var_4371, x = aw_357_cast_fp16)[name = tensor("op_5257_cast_fp16")]; + tensor var_5258_cast_fp16 = softmax(axis = var_4371, x = aw_359_cast_fp16)[name = tensor("op_5258_cast_fp16")]; + tensor var_5260_equation_0 = const()[name = tensor("op_5260_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5260_cast_fp16 = einsum(equation = var_5260_equation_0, values = (var_5080_cast_fp16, var_5239_cast_fp16))[name = tensor("op_5260_cast_fp16")]; + tensor var_5262_equation_0 = const()[name = tensor("op_5262_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5262_cast_fp16 = einsum(equation = var_5262_equation_0, values = (var_5084_cast_fp16, var_5240_cast_fp16))[name = tensor("op_5262_cast_fp16")]; + tensor var_5264_equation_0 = const()[name = tensor("op_5264_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5264_cast_fp16 = einsum(equation = var_5264_equation_0, values = (var_5088_cast_fp16, var_5241_cast_fp16))[name = tensor("op_5264_cast_fp16")]; + tensor var_5266_equation_0 = const()[name = tensor("op_5266_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5266_cast_fp16 = einsum(equation = var_5266_equation_0, values = (var_5092_cast_fp16, var_5242_cast_fp16))[name = tensor("op_5266_cast_fp16")]; + tensor var_5268_equation_0 = const()[name = tensor("op_5268_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5268_cast_fp16 = einsum(equation = var_5268_equation_0, values = (var_5096_cast_fp16, var_5243_cast_fp16))[name = tensor("op_5268_cast_fp16")]; + tensor var_5270_equation_0 = const()[name = tensor("op_5270_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5270_cast_fp16 = einsum(equation = var_5270_equation_0, values = (var_5100_cast_fp16, var_5244_cast_fp16))[name = tensor("op_5270_cast_fp16")]; + tensor var_5272_equation_0 = const()[name = tensor("op_5272_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5272_cast_fp16 = einsum(equation = var_5272_equation_0, values = (var_5104_cast_fp16, var_5245_cast_fp16))[name = tensor("op_5272_cast_fp16")]; + tensor var_5274_equation_0 = const()[name = tensor("op_5274_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5274_cast_fp16 = einsum(equation = var_5274_equation_0, values = (var_5108_cast_fp16, var_5246_cast_fp16))[name = tensor("op_5274_cast_fp16")]; + tensor var_5276_equation_0 = const()[name = tensor("op_5276_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5276_cast_fp16 = einsum(equation = var_5276_equation_0, values = (var_5112_cast_fp16, var_5247_cast_fp16))[name = tensor("op_5276_cast_fp16")]; + tensor var_5278_equation_0 = const()[name = tensor("op_5278_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5278_cast_fp16 = einsum(equation = var_5278_equation_0, values = (var_5116_cast_fp16, var_5248_cast_fp16))[name = tensor("op_5278_cast_fp16")]; + tensor var_5280_equation_0 = const()[name = tensor("op_5280_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5280_cast_fp16 = einsum(equation = var_5280_equation_0, values = (var_5120_cast_fp16, var_5249_cast_fp16))[name = tensor("op_5280_cast_fp16")]; + tensor var_5282_equation_0 = const()[name = tensor("op_5282_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5282_cast_fp16 = einsum(equation = var_5282_equation_0, values = (var_5124_cast_fp16, var_5250_cast_fp16))[name = tensor("op_5282_cast_fp16")]; + tensor var_5284_equation_0 = const()[name = tensor("op_5284_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5284_cast_fp16 = einsum(equation = var_5284_equation_0, values = (var_5128_cast_fp16, var_5251_cast_fp16))[name = tensor("op_5284_cast_fp16")]; + tensor var_5286_equation_0 = const()[name = tensor("op_5286_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5286_cast_fp16 = einsum(equation = var_5286_equation_0, values = (var_5132_cast_fp16, var_5252_cast_fp16))[name = tensor("op_5286_cast_fp16")]; + tensor var_5288_equation_0 = const()[name = tensor("op_5288_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5288_cast_fp16 = einsum(equation = var_5288_equation_0, values = (var_5136_cast_fp16, var_5253_cast_fp16))[name = tensor("op_5288_cast_fp16")]; + tensor var_5290_equation_0 = const()[name = tensor("op_5290_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5290_cast_fp16 = einsum(equation = var_5290_equation_0, values = (var_5140_cast_fp16, var_5254_cast_fp16))[name = tensor("op_5290_cast_fp16")]; + tensor var_5292_equation_0 = const()[name = tensor("op_5292_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5292_cast_fp16 = einsum(equation = var_5292_equation_0, values = (var_5144_cast_fp16, var_5255_cast_fp16))[name = tensor("op_5292_cast_fp16")]; + tensor var_5294_equation_0 = const()[name = tensor("op_5294_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5294_cast_fp16 = einsum(equation = var_5294_equation_0, values = (var_5148_cast_fp16, var_5256_cast_fp16))[name = tensor("op_5294_cast_fp16")]; + tensor var_5296_equation_0 = const()[name = tensor("op_5296_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5296_cast_fp16 = einsum(equation = var_5296_equation_0, values = (var_5152_cast_fp16, var_5257_cast_fp16))[name = tensor("op_5296_cast_fp16")]; + tensor var_5298_equation_0 = const()[name = tensor("op_5298_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_5298_cast_fp16 = einsum(equation = var_5298_equation_0, values = (var_5156_cast_fp16, var_5258_cast_fp16))[name = tensor("op_5298_cast_fp16")]; + tensor input_217_interleave_0 = const()[name = tensor("input_217_interleave_0"), val = tensor(false)]; + tensor input_217_cast_fp16 = concat(axis = var_4371, interleave = input_217_interleave_0, values = (var_5260_cast_fp16, var_5262_cast_fp16, var_5264_cast_fp16, var_5266_cast_fp16, var_5268_cast_fp16, var_5270_cast_fp16, var_5272_cast_fp16, var_5274_cast_fp16, var_5276_cast_fp16, var_5278_cast_fp16, var_5280_cast_fp16, var_5282_cast_fp16, var_5284_cast_fp16, var_5286_cast_fp16, var_5288_cast_fp16, var_5290_cast_fp16, var_5292_cast_fp16, var_5294_cast_fp16, var_5296_cast_fp16, var_5298_cast_fp16))[name = tensor("input_217_cast_fp16")]; + tensor var_5304 = const()[name = tensor("op_5304"), val = tensor([1, 1])]; + tensor var_5306 = const()[name = tensor("op_5306"), val = tensor([1, 1])]; + tensor var_5308_pad_type_0 = const()[name = tensor("op_5308_pad_type_0"), val = tensor("custom")]; + tensor var_5308_pad_0 = const()[name = tensor("op_5308_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(595166144)))]; + tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(598443008)))]; + tensor var_5308_cast_fp16 = conv(bias = mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_5306, groups = var_4371, pad = var_5308_pad_0, pad_type = var_5308_pad_type_0, strides = var_5304, weight = mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_217_cast_fp16)[name = tensor("op_5308_cast_fp16")]; + tensor inputs_41_cast_fp16 = add(x = var_5308_cast_fp16, y = inputs_39_cast_fp16)[name = tensor("inputs_41_cast_fp16")]; + tensor var_5312 = const()[name = tensor("op_5312"), val = tensor([1])]; + tensor channels_mean_41_cast_fp16 = reduce_mean(axes = var_5312, keep_dims = var_4366, x = inputs_41_cast_fp16)[name = tensor("channels_mean_41_cast_fp16")]; + tensor zero_mean_41_cast_fp16 = sub(x = inputs_41_cast_fp16, y = channels_mean_41_cast_fp16)[name = tensor("zero_mean_41_cast_fp16")]; + tensor zero_mean_sq_41_cast_fp16 = mul(x = zero_mean_41_cast_fp16, y = zero_mean_41_cast_fp16)[name = tensor("zero_mean_sq_41_cast_fp16")]; + tensor var_5316 = const()[name = tensor("op_5316"), val = tensor([1])]; + tensor var_5317_cast_fp16 = reduce_mean(axes = var_5316, keep_dims = var_4366, x = zero_mean_sq_41_cast_fp16)[name = tensor("op_5317_cast_fp16")]; + tensor var_5318_to_fp16 = const()[name = tensor("op_5318_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_5319_cast_fp16 = add(x = var_5317_cast_fp16, y = var_5318_to_fp16)[name = tensor("op_5319_cast_fp16")]; + tensor denom_41_epsilon_0_to_fp16 = const()[name = tensor("denom_41_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_41_cast_fp16 = rsqrt(epsilon = denom_41_epsilon_0_to_fp16, x = var_5319_cast_fp16)[name = tensor("denom_41_cast_fp16")]; + tensor out_41_cast_fp16 = mul(x = zero_mean_41_cast_fp16, y = denom_41_cast_fp16)[name = tensor("out_41_cast_fp16")]; + tensor var_5323_to_fp16 = const()[name = tensor("op_5323_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(598445632)))]; + tensor var_5324_cast_fp16 = add(x = out_41_cast_fp16, y = var_5323_to_fp16)[name = tensor("op_5324_cast_fp16")]; + tensor var_5326_to_fp16 = const()[name = tensor("op_5326_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(598448256)))]; + tensor input_219_cast_fp16 = mul(x = var_5324_cast_fp16, y = var_5326_to_fp16)[name = tensor("input_219_cast_fp16")]; + tensor var_5334 = const()[name = tensor("op_5334"), val = tensor([1, 1])]; + tensor var_5336 = const()[name = tensor("op_5336"), val = tensor([1, 1])]; + tensor var_5338_pad_type_0 = const()[name = tensor("op_5338_pad_type_0"), val = tensor("custom")]; + tensor var_5338_pad_0 = const()[name = tensor("op_5338_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(598450880)))]; + tensor mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(624665344)))]; + tensor var_5338_cast_fp16 = conv(bias = mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_5336, groups = var_4371, pad = var_5338_pad_0, pad_type = var_5338_pad_type_0, strides = var_5334, weight = mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_219_cast_fp16)[name = tensor("op_5338_cast_fp16")]; + tensor var_5339_split_sizes_0 = const()[name = tensor("op_5339_split_sizes_0"), val = tensor([5120, 5120])]; + tensor var_5339_axis_0 = const()[name = tensor("op_5339_axis_0"), val = tensor(1)]; + tensor var_5339_cast_fp16_0, tensor var_5339_cast_fp16_1 = split(axis = var_5339_axis_0, split_sizes = var_5339_split_sizes_0, x = var_5338_cast_fp16)[name = tensor("op_5339_cast_fp16")]; + tensor var_5341_mode_0 = const()[name = tensor("op_5341_mode_0"), val = tensor("EXACT")]; + tensor var_5341_cast_fp16 = gelu(mode = var_5341_mode_0, x = var_5339_cast_fp16_1)[name = tensor("op_5341_cast_fp16")]; + tensor input_221_cast_fp16 = mul(x = var_5339_cast_fp16_0, y = var_5341_cast_fp16)[name = tensor("input_221_cast_fp16")]; + tensor var_5345 = const()[name = tensor("op_5345"), val = tensor([1, 1])]; + tensor var_5347 = const()[name = tensor("op_5347"), val = tensor([1, 1])]; + tensor var_5349_pad_type_0 = const()[name = tensor("op_5349_pad_type_0"), val = tensor("custom")]; + tensor var_5349_pad_0 = const()[name = tensor("op_5349_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(624685888)))]; + tensor mid_block_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(637793152)))]; + tensor var_5349_cast_fp16 = conv(bias = mid_block_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_5347, groups = var_4371, pad = var_5349_pad_0, pad_type = var_5349_pad_type_0, strides = var_5345, weight = mid_block_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_221_cast_fp16)[name = tensor("op_5349_cast_fp16")]; + tensor hidden_states_131_cast_fp16 = add(x = var_5349_cast_fp16, y = inputs_41_cast_fp16)[name = tensor("hidden_states_131_cast_fp16")]; + tensor var_5351 = const()[name = tensor("op_5351"), val = tensor([2, 1280, 6, 6])]; + tensor input_223_cast_fp16 = reshape(shape = var_5351, x = hidden_states_131_cast_fp16)[name = tensor("input_223_cast_fp16")]; + tensor var_5355 = const()[name = tensor("op_5355"), val = tensor([1, 1])]; + tensor var_5357 = const()[name = tensor("op_5357"), val = tensor([1, 1])]; + tensor hidden_states_133_pad_type_0 = const()[name = tensor("hidden_states_133_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_133_pad_0 = const()[name = tensor("hidden_states_133_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(637795776)))]; + tensor mid_block_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641072640)))]; + tensor hidden_states_133_cast_fp16 = conv(bias = mid_block_attentions_0_proj_out_bias_to_fp16, dilations = var_5357, groups = var_4371, pad = hidden_states_133_pad_0, pad_type = hidden_states_133_pad_type_0, strides = var_5355, weight = mid_block_attentions_0_proj_out_weight_to_fp16, x = input_223_cast_fp16)[name = tensor("hidden_states_133_cast_fp16")]; + tensor input_225_cast_fp16 = add(x = hidden_states_133_cast_fp16, y = hidden_states_121_cast_fp16)[name = tensor("input_225_cast_fp16")]; + tensor reshape_100_shape_0 = const()[name = tensor("reshape_100_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_100_cast_fp16 = reshape(shape = reshape_100_shape_0, x = input_225_cast_fp16)[name = tensor("reshape_100_cast_fp16")]; + tensor reduce_mean_75_axes_0 = const()[name = tensor("reduce_mean_75_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_75_keep_dims_0 = const()[name = tensor("reduce_mean_75_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_75_cast_fp16 = reduce_mean(axes = reduce_mean_75_axes_0, keep_dims = reduce_mean_75_keep_dims_0, x = reshape_100_cast_fp16)[name = tensor("reduce_mean_75_cast_fp16")]; + tensor sub_50_cast_fp16 = sub(x = reshape_100_cast_fp16, y = reduce_mean_75_cast_fp16)[name = tensor("sub_50_cast_fp16")]; + tensor square_25_cast_fp16 = square(x = sub_50_cast_fp16)[name = tensor("square_25_cast_fp16")]; + tensor reduce_mean_77_axes_0 = const()[name = tensor("reduce_mean_77_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_77_keep_dims_0 = const()[name = tensor("reduce_mean_77_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_77_cast_fp16 = reduce_mean(axes = reduce_mean_77_axes_0, keep_dims = reduce_mean_77_keep_dims_0, x = square_25_cast_fp16)[name = tensor("reduce_mean_77_cast_fp16")]; + tensor add_50_y_0_to_fp16 = const()[name = tensor("add_50_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_50_cast_fp16 = add(x = reduce_mean_77_cast_fp16, y = add_50_y_0_to_fp16)[name = tensor("add_50_cast_fp16")]; + tensor sqrt_25_cast_fp16 = sqrt(x = add_50_cast_fp16)[name = tensor("sqrt_25_cast_fp16")]; + tensor real_div_25_cast_fp16 = real_div(x = sub_50_cast_fp16, y = sqrt_25_cast_fp16)[name = tensor("real_div_25_cast_fp16")]; + tensor reshape_101_shape_0 = const()[name = tensor("reshape_101_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_101_cast_fp16 = reshape(shape = reshape_101_shape_0, x = real_div_25_cast_fp16)[name = tensor("reshape_101_cast_fp16")]; + tensor add_51_gamma_0_to_fp16 = const()[name = tensor("add_51_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641075264)))]; + tensor add_51_beta_0_to_fp16 = const()[name = tensor("add_51_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641077888)))]; + tensor add_51_epsilon_0_to_fp16 = const()[name = tensor("add_51_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_51_cast_fp16 = batch_norm(beta = add_51_beta_0_to_fp16, epsilon = add_51_epsilon_0_to_fp16, gamma = add_51_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_101_cast_fp16)[name = tensor("add_51_cast_fp16")]; + tensor input_229_cast_fp16 = silu(x = add_51_cast_fp16)[name = tensor("input_229_cast_fp16")]; + tensor var_5372 = const()[name = tensor("op_5372"), val = tensor([1, 1])]; + tensor var_5374 = const()[name = tensor("op_5374"), val = tensor([1, 1])]; + tensor hidden_states_135_pad_type_0 = const()[name = tensor("hidden_states_135_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_135_pad_0 = const()[name = tensor("hidden_states_135_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor mid_block_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("mid_block_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641080512)))]; + tensor mid_block_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("mid_block_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(670571776)))]; + tensor hidden_states_135_cast_fp16 = conv(bias = mid_block_resnets_1_conv1_bias_to_fp16, dilations = var_5374, groups = var_4371, pad = hidden_states_135_pad_0, pad_type = hidden_states_135_pad_type_0, strides = var_5372, weight = mid_block_resnets_1_conv1_weight_to_fp16, x = input_229_cast_fp16)[name = tensor("hidden_states_135_cast_fp16")]; + tensor var_5380 = const()[name = tensor("op_5380"), val = tensor([1, 1])]; + tensor var_5382 = const()[name = tensor("op_5382"), val = tensor([1, 1])]; + tensor temb_19_pad_type_0 = const()[name = tensor("temb_19_pad_type_0"), val = tensor("custom")]; + tensor temb_19_pad_0 = const()[name = tensor("temb_19_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor mid_block_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("mid_block_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(670574400)))]; + tensor mid_block_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("mid_block_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673851264)))]; + tensor temb_19_cast_fp16 = conv(bias = mid_block_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_5382, groups = var_4371, pad = temb_19_pad_0, pad_type = temb_19_pad_type_0, strides = var_5380, weight = mid_block_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_19_cast_fp16")]; + tensor input_233_cast_fp16 = add(x = hidden_states_135_cast_fp16, y = temb_19_cast_fp16)[name = tensor("input_233_cast_fp16")]; + tensor reshape_104_shape_0 = const()[name = tensor("reshape_104_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_104_cast_fp16 = reshape(shape = reshape_104_shape_0, x = input_233_cast_fp16)[name = tensor("reshape_104_cast_fp16")]; + tensor reduce_mean_78_axes_0 = const()[name = tensor("reduce_mean_78_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_78_keep_dims_0 = const()[name = tensor("reduce_mean_78_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_78_cast_fp16 = reduce_mean(axes = reduce_mean_78_axes_0, keep_dims = reduce_mean_78_keep_dims_0, x = reshape_104_cast_fp16)[name = tensor("reduce_mean_78_cast_fp16")]; + tensor sub_52_cast_fp16 = sub(x = reshape_104_cast_fp16, y = reduce_mean_78_cast_fp16)[name = tensor("sub_52_cast_fp16")]; + tensor square_26_cast_fp16 = square(x = sub_52_cast_fp16)[name = tensor("square_26_cast_fp16")]; + tensor reduce_mean_80_axes_0 = const()[name = tensor("reduce_mean_80_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_80_keep_dims_0 = const()[name = tensor("reduce_mean_80_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_80_cast_fp16 = reduce_mean(axes = reduce_mean_80_axes_0, keep_dims = reduce_mean_80_keep_dims_0, x = square_26_cast_fp16)[name = tensor("reduce_mean_80_cast_fp16")]; + tensor add_52_y_0_to_fp16 = const()[name = tensor("add_52_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_52_cast_fp16 = add(x = reduce_mean_80_cast_fp16, y = add_52_y_0_to_fp16)[name = tensor("add_52_cast_fp16")]; + tensor sqrt_26_cast_fp16 = sqrt(x = add_52_cast_fp16)[name = tensor("sqrt_26_cast_fp16")]; + tensor real_div_26_cast_fp16 = real_div(x = sub_52_cast_fp16, y = sqrt_26_cast_fp16)[name = tensor("real_div_26_cast_fp16")]; + tensor reshape_105_shape_0 = const()[name = tensor("reshape_105_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_105_cast_fp16 = reshape(shape = reshape_105_shape_0, x = real_div_26_cast_fp16)[name = tensor("reshape_105_cast_fp16")]; + tensor add_53_gamma_0_to_fp16 = const()[name = tensor("add_53_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673853888)))]; + tensor add_53_beta_0_to_fp16 = const()[name = tensor("add_53_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673856512)))]; + tensor add_53_epsilon_0_to_fp16 = const()[name = tensor("add_53_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_53_cast_fp16 = batch_norm(beta = add_53_beta_0_to_fp16, epsilon = add_53_epsilon_0_to_fp16, gamma = add_53_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_105_cast_fp16)[name = tensor("add_53_cast_fp16")]; + tensor input_237_cast_fp16 = silu(x = add_53_cast_fp16)[name = tensor("input_237_cast_fp16")]; + tensor var_5392 = const()[name = tensor("op_5392"), val = tensor([1, 1])]; + tensor var_5394 = const()[name = tensor("op_5394"), val = tensor([1, 1])]; + tensor hidden_states_137_pad_type_0 = const()[name = tensor("hidden_states_137_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_137_pad_0 = const()[name = tensor("hidden_states_137_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor mid_block_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("mid_block_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673859136)))]; + tensor mid_block_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("mid_block_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703350400)))]; + tensor hidden_states_137_cast_fp16 = conv(bias = mid_block_resnets_1_conv2_bias_to_fp16, dilations = var_5394, groups = var_4371, pad = hidden_states_137_pad_0, pad_type = hidden_states_137_pad_type_0, strides = var_5392, weight = mid_block_resnets_1_conv2_weight_to_fp16, x = input_237_cast_fp16)[name = tensor("hidden_states_137_cast_fp16")]; + tensor hidden_states_139_cast_fp16 = add(x = input_225_cast_fp16, y = hidden_states_137_cast_fp16)[name = tensor("hidden_states_139_cast_fp16")]; + tensor var_5405 = const()[name = tensor("op_5405"), val = tensor(1)]; + tensor input_239_interleave_0 = const()[name = tensor("input_239_interleave_0"), val = tensor(false)]; + tensor input_239_cast_fp16 = concat(axis = var_5405, interleave = input_239_interleave_0, values = (hidden_states_139_cast_fp16, input_199_cast_fp16))[name = tensor("input_239_cast_fp16")]; + tensor reshape_108_shape_0 = const()[name = tensor("reshape_108_shape_0"), val = tensor([2, 32, 80, 6, 6])]; + tensor reshape_108_cast_fp16 = reshape(shape = reshape_108_shape_0, x = input_239_cast_fp16)[name = tensor("reshape_108_cast_fp16")]; + tensor reduce_mean_81_axes_0 = const()[name = tensor("reduce_mean_81_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_81_keep_dims_0 = const()[name = tensor("reduce_mean_81_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_81_cast_fp16 = reduce_mean(axes = reduce_mean_81_axes_0, keep_dims = reduce_mean_81_keep_dims_0, x = reshape_108_cast_fp16)[name = tensor("reduce_mean_81_cast_fp16")]; + tensor sub_54_cast_fp16 = sub(x = reshape_108_cast_fp16, y = reduce_mean_81_cast_fp16)[name = tensor("sub_54_cast_fp16")]; + tensor square_27_cast_fp16 = square(x = sub_54_cast_fp16)[name = tensor("square_27_cast_fp16")]; + tensor reduce_mean_83_axes_0 = const()[name = tensor("reduce_mean_83_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_83_keep_dims_0 = const()[name = tensor("reduce_mean_83_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_83_cast_fp16 = reduce_mean(axes = reduce_mean_83_axes_0, keep_dims = reduce_mean_83_keep_dims_0, x = square_27_cast_fp16)[name = tensor("reduce_mean_83_cast_fp16")]; + tensor add_54_y_0_to_fp16 = const()[name = tensor("add_54_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_54_cast_fp16 = add(x = reduce_mean_83_cast_fp16, y = add_54_y_0_to_fp16)[name = tensor("add_54_cast_fp16")]; + tensor sqrt_27_cast_fp16 = sqrt(x = add_54_cast_fp16)[name = tensor("sqrt_27_cast_fp16")]; + tensor real_div_27_cast_fp16 = real_div(x = sub_54_cast_fp16, y = sqrt_27_cast_fp16)[name = tensor("real_div_27_cast_fp16")]; + tensor reshape_109_shape_0 = const()[name = tensor("reshape_109_shape_0"), val = tensor([2, 2560, 6, 6])]; + tensor reshape_109_cast_fp16 = reshape(shape = reshape_109_shape_0, x = real_div_27_cast_fp16)[name = tensor("reshape_109_cast_fp16")]; + tensor add_55_mean_0_to_fp16 = const()[name = tensor("add_55_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703353024)))]; + tensor add_55_variance_0_to_fp16 = const()[name = tensor("add_55_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703358208)))]; + tensor add_55_gamma_0_to_fp16 = const()[name = tensor("add_55_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703363392)))]; + tensor add_55_beta_0_to_fp16 = const()[name = tensor("add_55_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703368576)))]; + tensor add_55_epsilon_0_to_fp16 = const()[name = tensor("add_55_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_55_cast_fp16 = batch_norm(beta = add_55_beta_0_to_fp16, epsilon = add_55_epsilon_0_to_fp16, gamma = add_55_gamma_0_to_fp16, mean = add_55_mean_0_to_fp16, variance = add_55_variance_0_to_fp16, x = reshape_109_cast_fp16)[name = tensor("add_55_cast_fp16")]; + tensor input_243_cast_fp16 = silu(x = add_55_cast_fp16)[name = tensor("input_243_cast_fp16")]; + tensor var_5428 = const()[name = tensor("op_5428"), val = tensor([1, 1])]; + tensor var_5430 = const()[name = tensor("op_5430"), val = tensor([1, 1])]; + tensor hidden_states_141_pad_type_0 = const()[name = tensor("hidden_states_141_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_141_pad_0 = const()[name = tensor("hidden_states_141_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_0_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703373760)))]; + tensor up_blocks_0_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762356224)))]; + tensor hidden_states_141_cast_fp16 = conv(bias = up_blocks_0_resnets_0_conv1_bias_to_fp16, dilations = var_5430, groups = var_5405, pad = hidden_states_141_pad_0, pad_type = hidden_states_141_pad_type_0, strides = var_5428, weight = up_blocks_0_resnets_0_conv1_weight_to_fp16, x = input_243_cast_fp16)[name = tensor("hidden_states_141_cast_fp16")]; + tensor var_5436 = const()[name = tensor("op_5436"), val = tensor([1, 1])]; + tensor var_5438 = const()[name = tensor("op_5438"), val = tensor([1, 1])]; + tensor temb_21_pad_type_0 = const()[name = tensor("temb_21_pad_type_0"), val = tensor("custom")]; + tensor temb_21_pad_0 = const()[name = tensor("temb_21_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_0_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762358848)))]; + tensor up_blocks_0_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765635712)))]; + tensor temb_21_cast_fp16 = conv(bias = up_blocks_0_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_5438, groups = var_5405, pad = temb_21_pad_0, pad_type = temb_21_pad_type_0, strides = var_5436, weight = up_blocks_0_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_21_cast_fp16")]; + tensor input_247_cast_fp16 = add(x = hidden_states_141_cast_fp16, y = temb_21_cast_fp16)[name = tensor("input_247_cast_fp16")]; + tensor reshape_112_shape_0 = const()[name = tensor("reshape_112_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_112_cast_fp16 = reshape(shape = reshape_112_shape_0, x = input_247_cast_fp16)[name = tensor("reshape_112_cast_fp16")]; + tensor reduce_mean_84_axes_0 = const()[name = tensor("reduce_mean_84_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_84_keep_dims_0 = const()[name = tensor("reduce_mean_84_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_84_cast_fp16 = reduce_mean(axes = reduce_mean_84_axes_0, keep_dims = reduce_mean_84_keep_dims_0, x = reshape_112_cast_fp16)[name = tensor("reduce_mean_84_cast_fp16")]; + tensor sub_56_cast_fp16 = sub(x = reshape_112_cast_fp16, y = reduce_mean_84_cast_fp16)[name = tensor("sub_56_cast_fp16")]; + tensor square_28_cast_fp16 = square(x = sub_56_cast_fp16)[name = tensor("square_28_cast_fp16")]; + tensor reduce_mean_86_axes_0 = const()[name = tensor("reduce_mean_86_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_86_keep_dims_0 = const()[name = tensor("reduce_mean_86_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_86_cast_fp16 = reduce_mean(axes = reduce_mean_86_axes_0, keep_dims = reduce_mean_86_keep_dims_0, x = square_28_cast_fp16)[name = tensor("reduce_mean_86_cast_fp16")]; + tensor add_56_y_0_to_fp16 = const()[name = tensor("add_56_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_56_cast_fp16 = add(x = reduce_mean_86_cast_fp16, y = add_56_y_0_to_fp16)[name = tensor("add_56_cast_fp16")]; + tensor sqrt_28_cast_fp16 = sqrt(x = add_56_cast_fp16)[name = tensor("sqrt_28_cast_fp16")]; + tensor real_div_28_cast_fp16 = real_div(x = sub_56_cast_fp16, y = sqrt_28_cast_fp16)[name = tensor("real_div_28_cast_fp16")]; + tensor reshape_113_shape_0 = const()[name = tensor("reshape_113_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_113_cast_fp16 = reshape(shape = reshape_113_shape_0, x = real_div_28_cast_fp16)[name = tensor("reshape_113_cast_fp16")]; + tensor add_57_gamma_0_to_fp16 = const()[name = tensor("add_57_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765638336)))]; + tensor add_57_beta_0_to_fp16 = const()[name = tensor("add_57_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765640960)))]; + tensor add_57_epsilon_0_to_fp16 = const()[name = tensor("add_57_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_57_cast_fp16 = batch_norm(beta = add_57_beta_0_to_fp16, epsilon = add_57_epsilon_0_to_fp16, gamma = add_57_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_113_cast_fp16)[name = tensor("add_57_cast_fp16")]; + tensor input_251_cast_fp16 = silu(x = add_57_cast_fp16)[name = tensor("input_251_cast_fp16")]; + tensor var_5448 = const()[name = tensor("op_5448"), val = tensor([1, 1])]; + tensor var_5450 = const()[name = tensor("op_5450"), val = tensor([1, 1])]; + tensor hidden_states_143_pad_type_0 = const()[name = tensor("hidden_states_143_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_143_pad_0 = const()[name = tensor("hidden_states_143_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_0_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765643584)))]; + tensor up_blocks_0_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795134848)))]; + tensor hidden_states_143_cast_fp16 = conv(bias = up_blocks_0_resnets_0_conv2_bias_to_fp16, dilations = var_5450, groups = var_5405, pad = hidden_states_143_pad_0, pad_type = hidden_states_143_pad_type_0, strides = var_5448, weight = up_blocks_0_resnets_0_conv2_weight_to_fp16, x = input_251_cast_fp16)[name = tensor("hidden_states_143_cast_fp16")]; + tensor var_5455 = const()[name = tensor("op_5455"), val = tensor([1, 1])]; + tensor var_5457 = const()[name = tensor("op_5457"), val = tensor([1, 1])]; + tensor x_5_pad_type_0 = const()[name = tensor("x_5_pad_type_0"), val = tensor("custom")]; + tensor x_5_pad_0 = const()[name = tensor("x_5_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_0_resnets_0_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795137472)))]; + tensor up_blocks_0_resnets_0_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801691136)))]; + tensor x_5_cast_fp16 = conv(bias = up_blocks_0_resnets_0_conv_shortcut_bias_to_fp16, dilations = var_5457, groups = var_5405, pad = x_5_pad_0, pad_type = x_5_pad_type_0, strides = var_5455, weight = up_blocks_0_resnets_0_conv_shortcut_weight_to_fp16, x = input_239_cast_fp16)[name = tensor("x_5_cast_fp16")]; + tensor hidden_states_145_cast_fp16 = add(x = x_5_cast_fp16, y = hidden_states_143_cast_fp16)[name = tensor("hidden_states_145_cast_fp16")]; + tensor input_253_interleave_0 = const()[name = tensor("input_253_interleave_0"), val = tensor(false)]; + tensor input_253_cast_fp16 = concat(axis = var_5405, interleave = input_253_interleave_0, values = (hidden_states_145_cast_fp16, input_185_cast_fp16))[name = tensor("input_253_cast_fp16")]; + tensor reshape_116_shape_0 = const()[name = tensor("reshape_116_shape_0"), val = tensor([2, 32, 80, 6, 6])]; + tensor reshape_116_cast_fp16 = reshape(shape = reshape_116_shape_0, x = input_253_cast_fp16)[name = tensor("reshape_116_cast_fp16")]; + tensor reduce_mean_87_axes_0 = const()[name = tensor("reduce_mean_87_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_87_keep_dims_0 = const()[name = tensor("reduce_mean_87_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_87_cast_fp16 = reduce_mean(axes = reduce_mean_87_axes_0, keep_dims = reduce_mean_87_keep_dims_0, x = reshape_116_cast_fp16)[name = tensor("reduce_mean_87_cast_fp16")]; + tensor sub_58_cast_fp16 = sub(x = reshape_116_cast_fp16, y = reduce_mean_87_cast_fp16)[name = tensor("sub_58_cast_fp16")]; + tensor square_29_cast_fp16 = square(x = sub_58_cast_fp16)[name = tensor("square_29_cast_fp16")]; + tensor reduce_mean_89_axes_0 = const()[name = tensor("reduce_mean_89_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_89_keep_dims_0 = const()[name = tensor("reduce_mean_89_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_89_cast_fp16 = reduce_mean(axes = reduce_mean_89_axes_0, keep_dims = reduce_mean_89_keep_dims_0, x = square_29_cast_fp16)[name = tensor("reduce_mean_89_cast_fp16")]; + tensor add_58_y_0_to_fp16 = const()[name = tensor("add_58_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_58_cast_fp16 = add(x = reduce_mean_89_cast_fp16, y = add_58_y_0_to_fp16)[name = tensor("add_58_cast_fp16")]; + tensor sqrt_29_cast_fp16 = sqrt(x = add_58_cast_fp16)[name = tensor("sqrt_29_cast_fp16")]; + tensor real_div_29_cast_fp16 = real_div(x = sub_58_cast_fp16, y = sqrt_29_cast_fp16)[name = tensor("real_div_29_cast_fp16")]; + tensor reshape_117_shape_0 = const()[name = tensor("reshape_117_shape_0"), val = tensor([2, 2560, 6, 6])]; + tensor reshape_117_cast_fp16 = reshape(shape = reshape_117_shape_0, x = real_div_29_cast_fp16)[name = tensor("reshape_117_cast_fp16")]; + tensor add_59_gamma_0_to_fp16 = const()[name = tensor("add_59_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801693760)))]; + tensor add_59_beta_0_to_fp16 = const()[name = tensor("add_59_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801698944)))]; + tensor add_59_epsilon_0_to_fp16 = const()[name = tensor("add_59_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_59_cast_fp16 = batch_norm(beta = add_59_beta_0_to_fp16, epsilon = add_59_epsilon_0_to_fp16, gamma = add_59_gamma_0_to_fp16, mean = add_55_mean_0_to_fp16, variance = add_55_variance_0_to_fp16, x = reshape_117_cast_fp16)[name = tensor("add_59_cast_fp16")]; + tensor input_257_cast_fp16 = silu(x = add_59_cast_fp16)[name = tensor("input_257_cast_fp16")]; + tensor var_5475 = const()[name = tensor("op_5475"), val = tensor([1, 1])]; + tensor var_5477 = const()[name = tensor("op_5477"), val = tensor([1, 1])]; + tensor hidden_states_147_pad_type_0 = const()[name = tensor("hidden_states_147_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_147_pad_0 = const()[name = tensor("hidden_states_147_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_0_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801704128)))]; + tensor up_blocks_0_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(860686592)))]; + tensor hidden_states_147_cast_fp16 = conv(bias = up_blocks_0_resnets_1_conv1_bias_to_fp16, dilations = var_5477, groups = var_5405, pad = hidden_states_147_pad_0, pad_type = hidden_states_147_pad_type_0, strides = var_5475, weight = up_blocks_0_resnets_1_conv1_weight_to_fp16, x = input_257_cast_fp16)[name = tensor("hidden_states_147_cast_fp16")]; + tensor var_5483 = const()[name = tensor("op_5483"), val = tensor([1, 1])]; + tensor var_5485 = const()[name = tensor("op_5485"), val = tensor([1, 1])]; + tensor temb_23_pad_type_0 = const()[name = tensor("temb_23_pad_type_0"), val = tensor("custom")]; + tensor temb_23_pad_0 = const()[name = tensor("temb_23_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_0_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(860689216)))]; + tensor up_blocks_0_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(863966080)))]; + tensor temb_23_cast_fp16 = conv(bias = up_blocks_0_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_5485, groups = var_5405, pad = temb_23_pad_0, pad_type = temb_23_pad_type_0, strides = var_5483, weight = up_blocks_0_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_23_cast_fp16")]; + tensor input_261_cast_fp16 = add(x = hidden_states_147_cast_fp16, y = temb_23_cast_fp16)[name = tensor("input_261_cast_fp16")]; + tensor reshape_120_shape_0 = const()[name = tensor("reshape_120_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_120_cast_fp16 = reshape(shape = reshape_120_shape_0, x = input_261_cast_fp16)[name = tensor("reshape_120_cast_fp16")]; + tensor reduce_mean_90_axes_0 = const()[name = tensor("reduce_mean_90_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_90_keep_dims_0 = const()[name = tensor("reduce_mean_90_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_90_cast_fp16 = reduce_mean(axes = reduce_mean_90_axes_0, keep_dims = reduce_mean_90_keep_dims_0, x = reshape_120_cast_fp16)[name = tensor("reduce_mean_90_cast_fp16")]; + tensor sub_60_cast_fp16 = sub(x = reshape_120_cast_fp16, y = reduce_mean_90_cast_fp16)[name = tensor("sub_60_cast_fp16")]; + tensor square_30_cast_fp16 = square(x = sub_60_cast_fp16)[name = tensor("square_30_cast_fp16")]; + tensor reduce_mean_92_axes_0 = const()[name = tensor("reduce_mean_92_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_92_keep_dims_0 = const()[name = tensor("reduce_mean_92_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_92_cast_fp16 = reduce_mean(axes = reduce_mean_92_axes_0, keep_dims = reduce_mean_92_keep_dims_0, x = square_30_cast_fp16)[name = tensor("reduce_mean_92_cast_fp16")]; + tensor add_60_y_0_to_fp16 = const()[name = tensor("add_60_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_60_cast_fp16 = add(x = reduce_mean_92_cast_fp16, y = add_60_y_0_to_fp16)[name = tensor("add_60_cast_fp16")]; + tensor sqrt_30_cast_fp16 = sqrt(x = add_60_cast_fp16)[name = tensor("sqrt_30_cast_fp16")]; + tensor real_div_30_cast_fp16 = real_div(x = sub_60_cast_fp16, y = sqrt_30_cast_fp16)[name = tensor("real_div_30_cast_fp16")]; + tensor reshape_121_shape_0 = const()[name = tensor("reshape_121_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_121_cast_fp16 = reshape(shape = reshape_121_shape_0, x = real_div_30_cast_fp16)[name = tensor("reshape_121_cast_fp16")]; + tensor add_61_gamma_0_to_fp16 = const()[name = tensor("add_61_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(863968704)))]; + tensor add_61_beta_0_to_fp16 = const()[name = tensor("add_61_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(863971328)))]; + tensor add_61_epsilon_0_to_fp16 = const()[name = tensor("add_61_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_61_cast_fp16 = batch_norm(beta = add_61_beta_0_to_fp16, epsilon = add_61_epsilon_0_to_fp16, gamma = add_61_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_121_cast_fp16)[name = tensor("add_61_cast_fp16")]; + tensor input_265_cast_fp16 = silu(x = add_61_cast_fp16)[name = tensor("input_265_cast_fp16")]; + tensor var_5495 = const()[name = tensor("op_5495"), val = tensor([1, 1])]; + tensor var_5497 = const()[name = tensor("op_5497"), val = tensor([1, 1])]; + tensor hidden_states_149_pad_type_0 = const()[name = tensor("hidden_states_149_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_149_pad_0 = const()[name = tensor("hidden_states_149_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_0_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(863973952)))]; + tensor up_blocks_0_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893465216)))]; + tensor hidden_states_149_cast_fp16 = conv(bias = up_blocks_0_resnets_1_conv2_bias_to_fp16, dilations = var_5497, groups = var_5405, pad = hidden_states_149_pad_0, pad_type = hidden_states_149_pad_type_0, strides = var_5495, weight = up_blocks_0_resnets_1_conv2_weight_to_fp16, x = input_265_cast_fp16)[name = tensor("hidden_states_149_cast_fp16")]; + tensor var_5502 = const()[name = tensor("op_5502"), val = tensor([1, 1])]; + tensor var_5504 = const()[name = tensor("op_5504"), val = tensor([1, 1])]; + tensor x_7_pad_type_0 = const()[name = tensor("x_7_pad_type_0"), val = tensor("custom")]; + tensor x_7_pad_0 = const()[name = tensor("x_7_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_0_resnets_1_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893467840)))]; + tensor up_blocks_0_resnets_1_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(900021504)))]; + tensor x_7_cast_fp16 = conv(bias = up_blocks_0_resnets_1_conv_shortcut_bias_to_fp16, dilations = var_5504, groups = var_5405, pad = x_7_pad_0, pad_type = x_7_pad_type_0, strides = var_5502, weight = up_blocks_0_resnets_1_conv_shortcut_weight_to_fp16, x = input_253_cast_fp16)[name = tensor("x_7_cast_fp16")]; + tensor hidden_states_151_cast_fp16 = add(x = x_7_cast_fp16, y = hidden_states_149_cast_fp16)[name = tensor("hidden_states_151_cast_fp16")]; + tensor input_267_interleave_0 = const()[name = tensor("input_267_interleave_0"), val = tensor(false)]; + tensor input_267_cast_fp16 = concat(axis = var_5405, interleave = input_267_interleave_0, values = (hidden_states_151_cast_fp16, input_171_cast_fp16))[name = tensor("input_267_cast_fp16")]; + tensor reshape_124_shape_0 = const()[name = tensor("reshape_124_shape_0"), val = tensor([2, 32, 80, 6, 6])]; + tensor reshape_124_cast_fp16 = reshape(shape = reshape_124_shape_0, x = input_267_cast_fp16)[name = tensor("reshape_124_cast_fp16")]; + tensor reduce_mean_93_axes_0 = const()[name = tensor("reduce_mean_93_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_93_keep_dims_0 = const()[name = tensor("reduce_mean_93_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_93_cast_fp16 = reduce_mean(axes = reduce_mean_93_axes_0, keep_dims = reduce_mean_93_keep_dims_0, x = reshape_124_cast_fp16)[name = tensor("reduce_mean_93_cast_fp16")]; + tensor sub_62_cast_fp16 = sub(x = reshape_124_cast_fp16, y = reduce_mean_93_cast_fp16)[name = tensor("sub_62_cast_fp16")]; + tensor square_31_cast_fp16 = square(x = sub_62_cast_fp16)[name = tensor("square_31_cast_fp16")]; + tensor reduce_mean_95_axes_0 = const()[name = tensor("reduce_mean_95_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_95_keep_dims_0 = const()[name = tensor("reduce_mean_95_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_95_cast_fp16 = reduce_mean(axes = reduce_mean_95_axes_0, keep_dims = reduce_mean_95_keep_dims_0, x = square_31_cast_fp16)[name = tensor("reduce_mean_95_cast_fp16")]; + tensor add_62_y_0_to_fp16 = const()[name = tensor("add_62_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_62_cast_fp16 = add(x = reduce_mean_95_cast_fp16, y = add_62_y_0_to_fp16)[name = tensor("add_62_cast_fp16")]; + tensor sqrt_31_cast_fp16 = sqrt(x = add_62_cast_fp16)[name = tensor("sqrt_31_cast_fp16")]; + tensor real_div_31_cast_fp16 = real_div(x = sub_62_cast_fp16, y = sqrt_31_cast_fp16)[name = tensor("real_div_31_cast_fp16")]; + tensor reshape_125_shape_0 = const()[name = tensor("reshape_125_shape_0"), val = tensor([2, 2560, 6, 6])]; + tensor reshape_125_cast_fp16 = reshape(shape = reshape_125_shape_0, x = real_div_31_cast_fp16)[name = tensor("reshape_125_cast_fp16")]; + tensor add_63_gamma_0_to_fp16 = const()[name = tensor("add_63_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(900024128)))]; + tensor add_63_beta_0_to_fp16 = const()[name = tensor("add_63_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(900029312)))]; + tensor add_63_epsilon_0_to_fp16 = const()[name = tensor("add_63_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_63_cast_fp16 = batch_norm(beta = add_63_beta_0_to_fp16, epsilon = add_63_epsilon_0_to_fp16, gamma = add_63_gamma_0_to_fp16, mean = add_55_mean_0_to_fp16, variance = add_55_variance_0_to_fp16, x = reshape_125_cast_fp16)[name = tensor("add_63_cast_fp16")]; + tensor input_271_cast_fp16 = silu(x = add_63_cast_fp16)[name = tensor("input_271_cast_fp16")]; + tensor var_5522 = const()[name = tensor("op_5522"), val = tensor([1, 1])]; + tensor var_5524 = const()[name = tensor("op_5524"), val = tensor([1, 1])]; + tensor hidden_states_153_pad_type_0 = const()[name = tensor("hidden_states_153_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_153_pad_0 = const()[name = tensor("hidden_states_153_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_0_resnets_2_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_2_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(900034496)))]; + tensor up_blocks_0_resnets_2_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_2_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959016960)))]; + tensor hidden_states_153_cast_fp16 = conv(bias = up_blocks_0_resnets_2_conv1_bias_to_fp16, dilations = var_5524, groups = var_5405, pad = hidden_states_153_pad_0, pad_type = hidden_states_153_pad_type_0, strides = var_5522, weight = up_blocks_0_resnets_2_conv1_weight_to_fp16, x = input_271_cast_fp16)[name = tensor("hidden_states_153_cast_fp16")]; + tensor var_5530 = const()[name = tensor("op_5530"), val = tensor([1, 1])]; + tensor var_5532 = const()[name = tensor("op_5532"), val = tensor([1, 1])]; + tensor temb_25_pad_type_0 = const()[name = tensor("temb_25_pad_type_0"), val = tensor("custom")]; + tensor temb_25_pad_0 = const()[name = tensor("temb_25_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_0_resnets_2_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_2_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(959019584)))]; + tensor up_blocks_0_resnets_2_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_2_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(962296448)))]; + tensor temb_25_cast_fp16 = conv(bias = up_blocks_0_resnets_2_time_emb_proj_bias_to_fp16, dilations = var_5532, groups = var_5405, pad = temb_25_pad_0, pad_type = temb_25_pad_type_0, strides = var_5530, weight = up_blocks_0_resnets_2_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_25_cast_fp16")]; + tensor input_275_cast_fp16 = add(x = hidden_states_153_cast_fp16, y = temb_25_cast_fp16)[name = tensor("input_275_cast_fp16")]; + tensor reshape_128_shape_0 = const()[name = tensor("reshape_128_shape_0"), val = tensor([2, 32, 40, 6, 6])]; + tensor reshape_128_cast_fp16 = reshape(shape = reshape_128_shape_0, x = input_275_cast_fp16)[name = tensor("reshape_128_cast_fp16")]; + tensor reduce_mean_96_axes_0 = const()[name = tensor("reduce_mean_96_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_96_keep_dims_0 = const()[name = tensor("reduce_mean_96_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_96_cast_fp16 = reduce_mean(axes = reduce_mean_96_axes_0, keep_dims = reduce_mean_96_keep_dims_0, x = reshape_128_cast_fp16)[name = tensor("reduce_mean_96_cast_fp16")]; + tensor sub_64_cast_fp16 = sub(x = reshape_128_cast_fp16, y = reduce_mean_96_cast_fp16)[name = tensor("sub_64_cast_fp16")]; + tensor square_32_cast_fp16 = square(x = sub_64_cast_fp16)[name = tensor("square_32_cast_fp16")]; + tensor reduce_mean_98_axes_0 = const()[name = tensor("reduce_mean_98_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_98_keep_dims_0 = const()[name = tensor("reduce_mean_98_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_98_cast_fp16 = reduce_mean(axes = reduce_mean_98_axes_0, keep_dims = reduce_mean_98_keep_dims_0, x = square_32_cast_fp16)[name = tensor("reduce_mean_98_cast_fp16")]; + tensor add_64_y_0_to_fp16 = const()[name = tensor("add_64_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_64_cast_fp16 = add(x = reduce_mean_98_cast_fp16, y = add_64_y_0_to_fp16)[name = tensor("add_64_cast_fp16")]; + tensor sqrt_32_cast_fp16 = sqrt(x = add_64_cast_fp16)[name = tensor("sqrt_32_cast_fp16")]; + tensor real_div_32_cast_fp16 = real_div(x = sub_64_cast_fp16, y = sqrt_32_cast_fp16)[name = tensor("real_div_32_cast_fp16")]; + tensor reshape_129_shape_0 = const()[name = tensor("reshape_129_shape_0"), val = tensor([2, 1280, 6, 6])]; + tensor reshape_129_cast_fp16 = reshape(shape = reshape_129_shape_0, x = real_div_32_cast_fp16)[name = tensor("reshape_129_cast_fp16")]; + tensor add_65_gamma_0_to_fp16 = const()[name = tensor("add_65_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(962299072)))]; + tensor add_65_beta_0_to_fp16 = const()[name = tensor("add_65_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(962301696)))]; + tensor add_65_epsilon_0_to_fp16 = const()[name = tensor("add_65_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_65_cast_fp16 = batch_norm(beta = add_65_beta_0_to_fp16, epsilon = add_65_epsilon_0_to_fp16, gamma = add_65_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_129_cast_fp16)[name = tensor("add_65_cast_fp16")]; + tensor input_279_cast_fp16 = silu(x = add_65_cast_fp16)[name = tensor("input_279_cast_fp16")]; + tensor var_5542 = const()[name = tensor("op_5542"), val = tensor([1, 1])]; + tensor var_5544 = const()[name = tensor("op_5544"), val = tensor([1, 1])]; + tensor hidden_states_155_pad_type_0 = const()[name = tensor("hidden_states_155_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_155_pad_0 = const()[name = tensor("hidden_states_155_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_0_resnets_2_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_2_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(962304320)))]; + tensor up_blocks_0_resnets_2_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_2_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(991795584)))]; + tensor hidden_states_155_cast_fp16 = conv(bias = up_blocks_0_resnets_2_conv2_bias_to_fp16, dilations = var_5544, groups = var_5405, pad = hidden_states_155_pad_0, pad_type = hidden_states_155_pad_type_0, strides = var_5542, weight = up_blocks_0_resnets_2_conv2_weight_to_fp16, x = input_279_cast_fp16)[name = tensor("hidden_states_155_cast_fp16")]; + tensor var_5549 = const()[name = tensor("op_5549"), val = tensor([1, 1])]; + tensor var_5551 = const()[name = tensor("op_5551"), val = tensor([1, 1])]; + tensor x_9_pad_type_0 = const()[name = tensor("x_9_pad_type_0"), val = tensor("custom")]; + tensor x_9_pad_0 = const()[name = tensor("x_9_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_0_resnets_2_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_2_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(991798208)))]; + tensor up_blocks_0_resnets_2_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_2_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998351872)))]; + tensor x_9_cast_fp16 = conv(bias = up_blocks_0_resnets_2_conv_shortcut_bias_to_fp16, dilations = var_5551, groups = var_5405, pad = x_9_pad_0, pad_type = x_9_pad_type_0, strides = var_5549, weight = up_blocks_0_resnets_2_conv_shortcut_weight_to_fp16, x = input_267_cast_fp16)[name = tensor("x_9_cast_fp16")]; + tensor input_281_cast_fp16 = add(x = x_9_cast_fp16, y = hidden_states_155_cast_fp16)[name = tensor("input_281_cast_fp16")]; + tensor input_283_scale_factor_height_0 = const()[name = tensor("input_283_scale_factor_height_0"), val = tensor(0x1p+1)]; + tensor input_283_scale_factor_width_0 = const()[name = tensor("input_283_scale_factor_width_0"), val = tensor(0x1p+1)]; + tensor input_283_cast_fp16 = upsample_nearest_neighbor(scale_factor_height = input_283_scale_factor_height_0, scale_factor_width = input_283_scale_factor_width_0, x = input_281_cast_fp16)[name = tensor("input_283_cast_fp16")]; + tensor var_5560 = const()[name = tensor("op_5560"), val = tensor([1, 1])]; + tensor var_5562 = const()[name = tensor("op_5562"), val = tensor([1, 1])]; + tensor hidden_states_157_pad_type_0 = const()[name = tensor("hidden_states_157_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_157_pad_0 = const()[name = tensor("hidden_states_157_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_0_upsamplers_0_conv_weight_to_fp16 = const()[name = tensor("up_blocks_0_upsamplers_0_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(998354496)))]; + tensor up_blocks_0_upsamplers_0_conv_bias_to_fp16 = const()[name = tensor("up_blocks_0_upsamplers_0_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1027845760)))]; + tensor hidden_states_157_cast_fp16 = conv(bias = up_blocks_0_upsamplers_0_conv_bias_to_fp16, dilations = var_5562, groups = var_5405, pad = hidden_states_157_pad_0, pad_type = hidden_states_157_pad_type_0, strides = var_5560, weight = up_blocks_0_upsamplers_0_conv_weight_to_fp16, x = input_283_cast_fp16)[name = tensor("hidden_states_157_cast_fp16")]; + tensor var_5594 = const()[name = tensor("op_5594"), val = tensor(true)]; + tensor var_5599 = const()[name = tensor("op_5599"), val = tensor(1)]; + tensor input_285_interleave_0 = const()[name = tensor("input_285_interleave_0"), val = tensor(false)]; + tensor input_285_cast_fp16 = concat(axis = var_5599, interleave = input_285_interleave_0, values = (hidden_states_157_cast_fp16, input_169_cast_fp16))[name = tensor("input_285_cast_fp16")]; + tensor reshape_132_shape_0 = const()[name = tensor("reshape_132_shape_0"), val = tensor([2, 32, 80, 12, 12])]; + tensor reshape_132_cast_fp16 = reshape(shape = reshape_132_shape_0, x = input_285_cast_fp16)[name = tensor("reshape_132_cast_fp16")]; + tensor reduce_mean_99_axes_0 = const()[name = tensor("reduce_mean_99_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_99_keep_dims_0 = const()[name = tensor("reduce_mean_99_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_99_cast_fp16 = reduce_mean(axes = reduce_mean_99_axes_0, keep_dims = reduce_mean_99_keep_dims_0, x = reshape_132_cast_fp16)[name = tensor("reduce_mean_99_cast_fp16")]; + tensor sub_66_cast_fp16 = sub(x = reshape_132_cast_fp16, y = reduce_mean_99_cast_fp16)[name = tensor("sub_66_cast_fp16")]; + tensor square_33_cast_fp16 = square(x = sub_66_cast_fp16)[name = tensor("square_33_cast_fp16")]; + tensor reduce_mean_101_axes_0 = const()[name = tensor("reduce_mean_101_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_101_keep_dims_0 = const()[name = tensor("reduce_mean_101_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_101_cast_fp16 = reduce_mean(axes = reduce_mean_101_axes_0, keep_dims = reduce_mean_101_keep_dims_0, x = square_33_cast_fp16)[name = tensor("reduce_mean_101_cast_fp16")]; + tensor add_66_y_0_to_fp16 = const()[name = tensor("add_66_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_66_cast_fp16 = add(x = reduce_mean_101_cast_fp16, y = add_66_y_0_to_fp16)[name = tensor("add_66_cast_fp16")]; + tensor sqrt_33_cast_fp16 = sqrt(x = add_66_cast_fp16)[name = tensor("sqrt_33_cast_fp16")]; + tensor real_div_33_cast_fp16 = real_div(x = sub_66_cast_fp16, y = sqrt_33_cast_fp16)[name = tensor("real_div_33_cast_fp16")]; + tensor reshape_133_shape_0 = const()[name = tensor("reshape_133_shape_0"), val = tensor([2, 2560, 12, 12])]; + tensor reshape_133_cast_fp16 = reshape(shape = reshape_133_shape_0, x = real_div_33_cast_fp16)[name = tensor("reshape_133_cast_fp16")]; + tensor add_67_gamma_0_to_fp16 = const()[name = tensor("add_67_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1027848384)))]; + tensor add_67_beta_0_to_fp16 = const()[name = tensor("add_67_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1027853568)))]; + tensor add_67_epsilon_0_to_fp16 = const()[name = tensor("add_67_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_67_cast_fp16 = batch_norm(beta = add_67_beta_0_to_fp16, epsilon = add_67_epsilon_0_to_fp16, gamma = add_67_gamma_0_to_fp16, mean = add_55_mean_0_to_fp16, variance = add_55_variance_0_to_fp16, x = reshape_133_cast_fp16)[name = tensor("add_67_cast_fp16")]; + tensor input_289_cast_fp16 = silu(x = add_67_cast_fp16)[name = tensor("input_289_cast_fp16")]; + tensor var_5628 = const()[name = tensor("op_5628"), val = tensor([1, 1])]; + tensor var_5630 = const()[name = tensor("op_5630"), val = tensor([1, 1])]; + tensor hidden_states_159_pad_type_0 = const()[name = tensor("hidden_states_159_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_159_pad_0 = const()[name = tensor("hidden_states_159_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_1_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1027858752)))]; + tensor up_blocks_1_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1086841216)))]; + tensor hidden_states_159_cast_fp16 = conv(bias = up_blocks_1_resnets_0_conv1_bias_to_fp16, dilations = var_5630, groups = var_5599, pad = hidden_states_159_pad_0, pad_type = hidden_states_159_pad_type_0, strides = var_5628, weight = up_blocks_1_resnets_0_conv1_weight_to_fp16, x = input_289_cast_fp16)[name = tensor("hidden_states_159_cast_fp16")]; + tensor var_5636 = const()[name = tensor("op_5636"), val = tensor([1, 1])]; + tensor var_5638 = const()[name = tensor("op_5638"), val = tensor([1, 1])]; + tensor temb_27_pad_type_0 = const()[name = tensor("temb_27_pad_type_0"), val = tensor("custom")]; + tensor temb_27_pad_0 = const()[name = tensor("temb_27_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1086843840)))]; + tensor up_blocks_1_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090120704)))]; + tensor temb_27_cast_fp16 = conv(bias = up_blocks_1_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_5638, groups = var_5599, pad = temb_27_pad_0, pad_type = temb_27_pad_type_0, strides = var_5636, weight = up_blocks_1_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_27_cast_fp16")]; + tensor input_293_cast_fp16 = add(x = hidden_states_159_cast_fp16, y = temb_27_cast_fp16)[name = tensor("input_293_cast_fp16")]; + tensor reshape_136_shape_0 = const()[name = tensor("reshape_136_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_136_cast_fp16 = reshape(shape = reshape_136_shape_0, x = input_293_cast_fp16)[name = tensor("reshape_136_cast_fp16")]; + tensor reduce_mean_102_axes_0 = const()[name = tensor("reduce_mean_102_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_102_keep_dims_0 = const()[name = tensor("reduce_mean_102_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_102_cast_fp16 = reduce_mean(axes = reduce_mean_102_axes_0, keep_dims = reduce_mean_102_keep_dims_0, x = reshape_136_cast_fp16)[name = tensor("reduce_mean_102_cast_fp16")]; + tensor sub_68_cast_fp16 = sub(x = reshape_136_cast_fp16, y = reduce_mean_102_cast_fp16)[name = tensor("sub_68_cast_fp16")]; + tensor square_34_cast_fp16 = square(x = sub_68_cast_fp16)[name = tensor("square_34_cast_fp16")]; + tensor reduce_mean_104_axes_0 = const()[name = tensor("reduce_mean_104_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_104_keep_dims_0 = const()[name = tensor("reduce_mean_104_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_104_cast_fp16 = reduce_mean(axes = reduce_mean_104_axes_0, keep_dims = reduce_mean_104_keep_dims_0, x = square_34_cast_fp16)[name = tensor("reduce_mean_104_cast_fp16")]; + tensor add_68_y_0_to_fp16 = const()[name = tensor("add_68_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_68_cast_fp16 = add(x = reduce_mean_104_cast_fp16, y = add_68_y_0_to_fp16)[name = tensor("add_68_cast_fp16")]; + tensor sqrt_34_cast_fp16 = sqrt(x = add_68_cast_fp16)[name = tensor("sqrt_34_cast_fp16")]; + tensor real_div_34_cast_fp16 = real_div(x = sub_68_cast_fp16, y = sqrt_34_cast_fp16)[name = tensor("real_div_34_cast_fp16")]; + tensor reshape_137_shape_0 = const()[name = tensor("reshape_137_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_137_cast_fp16 = reshape(shape = reshape_137_shape_0, x = real_div_34_cast_fp16)[name = tensor("reshape_137_cast_fp16")]; + tensor add_69_gamma_0_to_fp16 = const()[name = tensor("add_69_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090123328)))]; + tensor add_69_beta_0_to_fp16 = const()[name = tensor("add_69_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090125952)))]; + tensor add_69_epsilon_0_to_fp16 = const()[name = tensor("add_69_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_69_cast_fp16 = batch_norm(beta = add_69_beta_0_to_fp16, epsilon = add_69_epsilon_0_to_fp16, gamma = add_69_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_137_cast_fp16)[name = tensor("add_69_cast_fp16")]; + tensor input_297_cast_fp16 = silu(x = add_69_cast_fp16)[name = tensor("input_297_cast_fp16")]; + tensor var_5648 = const()[name = tensor("op_5648"), val = tensor([1, 1])]; + tensor var_5650 = const()[name = tensor("op_5650"), val = tensor([1, 1])]; + tensor hidden_states_161_pad_type_0 = const()[name = tensor("hidden_states_161_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_161_pad_0 = const()[name = tensor("hidden_states_161_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_1_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1090128576)))]; + tensor up_blocks_1_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1119619840)))]; + tensor hidden_states_161_cast_fp16 = conv(bias = up_blocks_1_resnets_0_conv2_bias_to_fp16, dilations = var_5650, groups = var_5599, pad = hidden_states_161_pad_0, pad_type = hidden_states_161_pad_type_0, strides = var_5648, weight = up_blocks_1_resnets_0_conv2_weight_to_fp16, x = input_297_cast_fp16)[name = tensor("hidden_states_161_cast_fp16")]; + tensor var_5655 = const()[name = tensor("op_5655"), val = tensor([1, 1])]; + tensor var_5657 = const()[name = tensor("op_5657"), val = tensor([1, 1])]; + tensor x_11_pad_type_0 = const()[name = tensor("x_11_pad_type_0"), val = tensor("custom")]; + tensor x_11_pad_0 = const()[name = tensor("x_11_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_resnets_0_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_0_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1119622464)))]; + tensor up_blocks_1_resnets_0_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_0_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1126176128)))]; + tensor x_11_cast_fp16 = conv(bias = up_blocks_1_resnets_0_conv_shortcut_bias_to_fp16, dilations = var_5657, groups = var_5599, pad = x_11_pad_0, pad_type = x_11_pad_type_0, strides = var_5655, weight = up_blocks_1_resnets_0_conv_shortcut_weight_to_fp16, x = input_285_cast_fp16)[name = tensor("x_11_cast_fp16")]; + tensor hidden_states_163_cast_fp16 = add(x = x_11_cast_fp16, y = hidden_states_161_cast_fp16)[name = tensor("hidden_states_163_cast_fp16")]; + tensor reshape_140_shape_0 = const()[name = tensor("reshape_140_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_140_cast_fp16 = reshape(shape = reshape_140_shape_0, x = hidden_states_163_cast_fp16)[name = tensor("reshape_140_cast_fp16")]; + tensor reduce_mean_105_axes_0 = const()[name = tensor("reduce_mean_105_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_105_keep_dims_0 = const()[name = tensor("reduce_mean_105_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_105_cast_fp16 = reduce_mean(axes = reduce_mean_105_axes_0, keep_dims = reduce_mean_105_keep_dims_0, x = reshape_140_cast_fp16)[name = tensor("reduce_mean_105_cast_fp16")]; + tensor sub_70_cast_fp16 = sub(x = reshape_140_cast_fp16, y = reduce_mean_105_cast_fp16)[name = tensor("sub_70_cast_fp16")]; + tensor square_35_cast_fp16 = square(x = sub_70_cast_fp16)[name = tensor("square_35_cast_fp16")]; + tensor reduce_mean_107_axes_0 = const()[name = tensor("reduce_mean_107_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_107_keep_dims_0 = const()[name = tensor("reduce_mean_107_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_107_cast_fp16 = reduce_mean(axes = reduce_mean_107_axes_0, keep_dims = reduce_mean_107_keep_dims_0, x = square_35_cast_fp16)[name = tensor("reduce_mean_107_cast_fp16")]; + tensor add_70_y_0_to_fp16 = const()[name = tensor("add_70_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_70_cast_fp16 = add(x = reduce_mean_107_cast_fp16, y = add_70_y_0_to_fp16)[name = tensor("add_70_cast_fp16")]; + tensor sqrt_35_cast_fp16 = sqrt(x = add_70_cast_fp16)[name = tensor("sqrt_35_cast_fp16")]; + tensor real_div_35_cast_fp16 = real_div(x = sub_70_cast_fp16, y = sqrt_35_cast_fp16)[name = tensor("real_div_35_cast_fp16")]; + tensor reshape_141_shape_0 = const()[name = tensor("reshape_141_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_141_cast_fp16 = reshape(shape = reshape_141_shape_0, x = real_div_35_cast_fp16)[name = tensor("reshape_141_cast_fp16")]; + tensor add_71_gamma_0_to_fp16 = const()[name = tensor("add_71_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1126178752)))]; + tensor add_71_beta_0_to_fp16 = const()[name = tensor("add_71_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1126181376)))]; + tensor add_71_epsilon_0_to_fp16 = const()[name = tensor("add_71_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_71_cast_fp16 = batch_norm(beta = add_71_beta_0_to_fp16, epsilon = add_71_epsilon_0_to_fp16, gamma = add_71_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_141_cast_fp16)[name = tensor("add_71_cast_fp16")]; + tensor var_5677 = const()[name = tensor("op_5677"), val = tensor([1, 1])]; + tensor var_5679 = const()[name = tensor("op_5679"), val = tensor([1, 1])]; + tensor hidden_states_165_pad_type_0 = const()[name = tensor("hidden_states_165_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_165_pad_0 = const()[name = tensor("hidden_states_165_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1126184000)))]; + tensor up_blocks_1_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129460864)))]; + tensor hidden_states_165_cast_fp16 = conv(bias = up_blocks_1_attentions_0_proj_in_bias_to_fp16, dilations = var_5679, groups = var_5599, pad = hidden_states_165_pad_0, pad_type = hidden_states_165_pad_type_0, strides = var_5677, weight = up_blocks_1_attentions_0_proj_in_weight_to_fp16, x = add_71_cast_fp16)[name = tensor("hidden_states_165_cast_fp16")]; + tensor var_5684 = const()[name = tensor("op_5684"), val = tensor([2, 1280, 1, 144])]; + tensor inputs_43_cast_fp16 = reshape(shape = var_5684, x = hidden_states_165_cast_fp16)[name = tensor("inputs_43_cast_fp16")]; + tensor var_5694 = const()[name = tensor("op_5694"), val = tensor([1])]; + tensor channels_mean_43_cast_fp16 = reduce_mean(axes = var_5694, keep_dims = var_5594, x = inputs_43_cast_fp16)[name = tensor("channels_mean_43_cast_fp16")]; + tensor zero_mean_43_cast_fp16 = sub(x = inputs_43_cast_fp16, y = channels_mean_43_cast_fp16)[name = tensor("zero_mean_43_cast_fp16")]; + tensor zero_mean_sq_43_cast_fp16 = mul(x = zero_mean_43_cast_fp16, y = zero_mean_43_cast_fp16)[name = tensor("zero_mean_sq_43_cast_fp16")]; + tensor var_5698 = const()[name = tensor("op_5698"), val = tensor([1])]; + tensor var_5699_cast_fp16 = reduce_mean(axes = var_5698, keep_dims = var_5594, x = zero_mean_sq_43_cast_fp16)[name = tensor("op_5699_cast_fp16")]; + tensor var_5700_to_fp16 = const()[name = tensor("op_5700_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_5701_cast_fp16 = add(x = var_5699_cast_fp16, y = var_5700_to_fp16)[name = tensor("op_5701_cast_fp16")]; + tensor denom_43_epsilon_0_to_fp16 = const()[name = tensor("denom_43_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_43_cast_fp16 = rsqrt(epsilon = denom_43_epsilon_0_to_fp16, x = var_5701_cast_fp16)[name = tensor("denom_43_cast_fp16")]; + tensor out_43_cast_fp16 = mul(x = zero_mean_43_cast_fp16, y = denom_43_cast_fp16)[name = tensor("out_43_cast_fp16")]; + tensor var_5705_to_fp16 = const()[name = tensor("op_5705_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129463488)))]; + tensor var_5706_cast_fp16 = add(x = out_43_cast_fp16, y = var_5705_to_fp16)[name = tensor("op_5706_cast_fp16")]; + tensor var_5708_to_fp16 = const()[name = tensor("op_5708_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129466112)))]; + tensor hidden_states_167_cast_fp16 = mul(x = var_5706_cast_fp16, y = var_5708_to_fp16)[name = tensor("hidden_states_167_cast_fp16")]; + tensor var_5715 = const()[name = tensor("op_5715"), val = tensor([1, 1])]; + tensor var_5717 = const()[name = tensor("op_5717"), val = tensor([1, 1])]; + tensor q_29_pad_type_0 = const()[name = tensor("q_29_pad_type_0"), val = tensor("custom")]; + tensor q_29_pad_0 = const()[name = tensor("q_29_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1129468736)))]; + tensor q_29_cast_fp16 = conv(dilations = var_5717, groups = var_5599, pad = q_29_pad_0, pad_type = q_29_pad_type_0, strides = var_5715, weight = up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_167_cast_fp16)[name = tensor("q_29_cast_fp16")]; + tensor var_5721 = const()[name = tensor("op_5721"), val = tensor([1, 1])]; + tensor var_5723 = const()[name = tensor("op_5723"), val = tensor([1, 1])]; + tensor k_57_pad_type_0 = const()[name = tensor("k_57_pad_type_0"), val = tensor("custom")]; + tensor k_57_pad_0 = const()[name = tensor("k_57_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1132745600)))]; + tensor k_57_cast_fp16 = conv(dilations = var_5723, groups = var_5599, pad = k_57_pad_0, pad_type = k_57_pad_type_0, strides = var_5721, weight = up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_167_cast_fp16)[name = tensor("k_57_cast_fp16")]; + tensor var_5727 = const()[name = tensor("op_5727"), val = tensor([1, 1])]; + tensor var_5729 = const()[name = tensor("op_5729"), val = tensor([1, 1])]; + tensor v_29_pad_type_0 = const()[name = tensor("v_29_pad_type_0"), val = tensor("custom")]; + tensor v_29_pad_0 = const()[name = tensor("v_29_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1136022464)))]; + tensor v_29_cast_fp16 = conv(dilations = var_5729, groups = var_5599, pad = v_29_pad_0, pad_type = v_29_pad_type_0, strides = var_5727, weight = up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_167_cast_fp16)[name = tensor("v_29_cast_fp16")]; + tensor var_5733_begin_0 = const()[name = tensor("op_5733_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_5733_end_0 = const()[name = tensor("op_5733_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_5733_end_mask_0 = const()[name = tensor("op_5733_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5733_cast_fp16 = slice_by_index(begin = var_5733_begin_0, end = var_5733_end_0, end_mask = var_5733_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5733_cast_fp16")]; + tensor var_5737_begin_0 = const()[name = tensor("op_5737_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_5737_end_0 = const()[name = tensor("op_5737_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_5737_end_mask_0 = const()[name = tensor("op_5737_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5737_cast_fp16 = slice_by_index(begin = var_5737_begin_0, end = var_5737_end_0, end_mask = var_5737_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5737_cast_fp16")]; + tensor var_5741_begin_0 = const()[name = tensor("op_5741_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_5741_end_0 = const()[name = tensor("op_5741_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_5741_end_mask_0 = const()[name = tensor("op_5741_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5741_cast_fp16 = slice_by_index(begin = var_5741_begin_0, end = var_5741_end_0, end_mask = var_5741_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5741_cast_fp16")]; + tensor var_5745_begin_0 = const()[name = tensor("op_5745_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_5745_end_0 = const()[name = tensor("op_5745_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_5745_end_mask_0 = const()[name = tensor("op_5745_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5745_cast_fp16 = slice_by_index(begin = var_5745_begin_0, end = var_5745_end_0, end_mask = var_5745_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5745_cast_fp16")]; + tensor var_5749_begin_0 = const()[name = tensor("op_5749_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_5749_end_0 = const()[name = tensor("op_5749_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_5749_end_mask_0 = const()[name = tensor("op_5749_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5749_cast_fp16 = slice_by_index(begin = var_5749_begin_0, end = var_5749_end_0, end_mask = var_5749_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5749_cast_fp16")]; + tensor var_5753_begin_0 = const()[name = tensor("op_5753_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_5753_end_0 = const()[name = tensor("op_5753_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_5753_end_mask_0 = const()[name = tensor("op_5753_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5753_cast_fp16 = slice_by_index(begin = var_5753_begin_0, end = var_5753_end_0, end_mask = var_5753_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5753_cast_fp16")]; + tensor var_5757_begin_0 = const()[name = tensor("op_5757_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_5757_end_0 = const()[name = tensor("op_5757_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_5757_end_mask_0 = const()[name = tensor("op_5757_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5757_cast_fp16 = slice_by_index(begin = var_5757_begin_0, end = var_5757_end_0, end_mask = var_5757_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5757_cast_fp16")]; + tensor var_5761_begin_0 = const()[name = tensor("op_5761_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_5761_end_0 = const()[name = tensor("op_5761_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_5761_end_mask_0 = const()[name = tensor("op_5761_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5761_cast_fp16 = slice_by_index(begin = var_5761_begin_0, end = var_5761_end_0, end_mask = var_5761_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5761_cast_fp16")]; + tensor var_5765_begin_0 = const()[name = tensor("op_5765_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_5765_end_0 = const()[name = tensor("op_5765_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_5765_end_mask_0 = const()[name = tensor("op_5765_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5765_cast_fp16 = slice_by_index(begin = var_5765_begin_0, end = var_5765_end_0, end_mask = var_5765_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5765_cast_fp16")]; + tensor var_5769_begin_0 = const()[name = tensor("op_5769_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_5769_end_0 = const()[name = tensor("op_5769_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_5769_end_mask_0 = const()[name = tensor("op_5769_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5769_cast_fp16 = slice_by_index(begin = var_5769_begin_0, end = var_5769_end_0, end_mask = var_5769_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5769_cast_fp16")]; + tensor var_5773_begin_0 = const()[name = tensor("op_5773_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_5773_end_0 = const()[name = tensor("op_5773_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_5773_end_mask_0 = const()[name = tensor("op_5773_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5773_cast_fp16 = slice_by_index(begin = var_5773_begin_0, end = var_5773_end_0, end_mask = var_5773_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5773_cast_fp16")]; + tensor var_5777_begin_0 = const()[name = tensor("op_5777_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_5777_end_0 = const()[name = tensor("op_5777_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_5777_end_mask_0 = const()[name = tensor("op_5777_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5777_cast_fp16 = slice_by_index(begin = var_5777_begin_0, end = var_5777_end_0, end_mask = var_5777_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5777_cast_fp16")]; + tensor var_5781_begin_0 = const()[name = tensor("op_5781_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_5781_end_0 = const()[name = tensor("op_5781_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_5781_end_mask_0 = const()[name = tensor("op_5781_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5781_cast_fp16 = slice_by_index(begin = var_5781_begin_0, end = var_5781_end_0, end_mask = var_5781_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5781_cast_fp16")]; + tensor var_5785_begin_0 = const()[name = tensor("op_5785_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_5785_end_0 = const()[name = tensor("op_5785_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_5785_end_mask_0 = const()[name = tensor("op_5785_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5785_cast_fp16 = slice_by_index(begin = var_5785_begin_0, end = var_5785_end_0, end_mask = var_5785_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5785_cast_fp16")]; + tensor var_5789_begin_0 = const()[name = tensor("op_5789_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_5789_end_0 = const()[name = tensor("op_5789_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_5789_end_mask_0 = const()[name = tensor("op_5789_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5789_cast_fp16 = slice_by_index(begin = var_5789_begin_0, end = var_5789_end_0, end_mask = var_5789_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5789_cast_fp16")]; + tensor var_5793_begin_0 = const()[name = tensor("op_5793_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_5793_end_0 = const()[name = tensor("op_5793_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_5793_end_mask_0 = const()[name = tensor("op_5793_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5793_cast_fp16 = slice_by_index(begin = var_5793_begin_0, end = var_5793_end_0, end_mask = var_5793_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5793_cast_fp16")]; + tensor var_5797_begin_0 = const()[name = tensor("op_5797_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_5797_end_0 = const()[name = tensor("op_5797_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_5797_end_mask_0 = const()[name = tensor("op_5797_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5797_cast_fp16 = slice_by_index(begin = var_5797_begin_0, end = var_5797_end_0, end_mask = var_5797_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5797_cast_fp16")]; + tensor var_5801_begin_0 = const()[name = tensor("op_5801_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_5801_end_0 = const()[name = tensor("op_5801_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_5801_end_mask_0 = const()[name = tensor("op_5801_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5801_cast_fp16 = slice_by_index(begin = var_5801_begin_0, end = var_5801_end_0, end_mask = var_5801_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5801_cast_fp16")]; + tensor var_5805_begin_0 = const()[name = tensor("op_5805_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_5805_end_0 = const()[name = tensor("op_5805_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_5805_end_mask_0 = const()[name = tensor("op_5805_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5805_cast_fp16 = slice_by_index(begin = var_5805_begin_0, end = var_5805_end_0, end_mask = var_5805_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5805_cast_fp16")]; + tensor var_5809_begin_0 = const()[name = tensor("op_5809_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_5809_end_0 = const()[name = tensor("op_5809_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_5809_end_mask_0 = const()[name = tensor("op_5809_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5809_cast_fp16 = slice_by_index(begin = var_5809_begin_0, end = var_5809_end_0, end_mask = var_5809_end_mask_0, x = q_29_cast_fp16)[name = tensor("op_5809_cast_fp16")]; + tensor k_59_perm_0 = const()[name = tensor("k_59_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_5816_begin_0 = const()[name = tensor("op_5816_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_5816_end_0 = const()[name = tensor("op_5816_end_0"), val = tensor([2, 144, 1, 64])]; + tensor var_5816_end_mask_0 = const()[name = tensor("op_5816_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_17 = transpose(perm = k_59_perm_0, x = k_57_cast_fp16)[name = tensor("transpose_17")]; + tensor var_5816_cast_fp16 = slice_by_index(begin = var_5816_begin_0, end = var_5816_end_0, end_mask = var_5816_end_mask_0, x = transpose_17)[name = tensor("op_5816_cast_fp16")]; + tensor var_5820_begin_0 = const()[name = tensor("op_5820_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_5820_end_0 = const()[name = tensor("op_5820_end_0"), val = tensor([2, 144, 1, 128])]; + tensor var_5820_end_mask_0 = const()[name = tensor("op_5820_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5820_cast_fp16 = slice_by_index(begin = var_5820_begin_0, end = var_5820_end_0, end_mask = var_5820_end_mask_0, x = transpose_17)[name = tensor("op_5820_cast_fp16")]; + tensor var_5824_begin_0 = const()[name = tensor("op_5824_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_5824_end_0 = const()[name = tensor("op_5824_end_0"), val = tensor([2, 144, 1, 192])]; + tensor var_5824_end_mask_0 = const()[name = tensor("op_5824_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5824_cast_fp16 = slice_by_index(begin = var_5824_begin_0, end = var_5824_end_0, end_mask = var_5824_end_mask_0, x = transpose_17)[name = tensor("op_5824_cast_fp16")]; + tensor var_5828_begin_0 = const()[name = tensor("op_5828_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_5828_end_0 = const()[name = tensor("op_5828_end_0"), val = tensor([2, 144, 1, 256])]; + tensor var_5828_end_mask_0 = const()[name = tensor("op_5828_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5828_cast_fp16 = slice_by_index(begin = var_5828_begin_0, end = var_5828_end_0, end_mask = var_5828_end_mask_0, x = transpose_17)[name = tensor("op_5828_cast_fp16")]; + tensor var_5832_begin_0 = const()[name = tensor("op_5832_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_5832_end_0 = const()[name = tensor("op_5832_end_0"), val = tensor([2, 144, 1, 320])]; + tensor var_5832_end_mask_0 = const()[name = tensor("op_5832_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5832_cast_fp16 = slice_by_index(begin = var_5832_begin_0, end = var_5832_end_0, end_mask = var_5832_end_mask_0, x = transpose_17)[name = tensor("op_5832_cast_fp16")]; + tensor var_5836_begin_0 = const()[name = tensor("op_5836_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_5836_end_0 = const()[name = tensor("op_5836_end_0"), val = tensor([2, 144, 1, 384])]; + tensor var_5836_end_mask_0 = const()[name = tensor("op_5836_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5836_cast_fp16 = slice_by_index(begin = var_5836_begin_0, end = var_5836_end_0, end_mask = var_5836_end_mask_0, x = transpose_17)[name = tensor("op_5836_cast_fp16")]; + tensor var_5840_begin_0 = const()[name = tensor("op_5840_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_5840_end_0 = const()[name = tensor("op_5840_end_0"), val = tensor([2, 144, 1, 448])]; + tensor var_5840_end_mask_0 = const()[name = tensor("op_5840_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5840_cast_fp16 = slice_by_index(begin = var_5840_begin_0, end = var_5840_end_0, end_mask = var_5840_end_mask_0, x = transpose_17)[name = tensor("op_5840_cast_fp16")]; + tensor var_5844_begin_0 = const()[name = tensor("op_5844_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_5844_end_0 = const()[name = tensor("op_5844_end_0"), val = tensor([2, 144, 1, 512])]; + tensor var_5844_end_mask_0 = const()[name = tensor("op_5844_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5844_cast_fp16 = slice_by_index(begin = var_5844_begin_0, end = var_5844_end_0, end_mask = var_5844_end_mask_0, x = transpose_17)[name = tensor("op_5844_cast_fp16")]; + tensor var_5848_begin_0 = const()[name = tensor("op_5848_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_5848_end_0 = const()[name = tensor("op_5848_end_0"), val = tensor([2, 144, 1, 576])]; + tensor var_5848_end_mask_0 = const()[name = tensor("op_5848_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5848_cast_fp16 = slice_by_index(begin = var_5848_begin_0, end = var_5848_end_0, end_mask = var_5848_end_mask_0, x = transpose_17)[name = tensor("op_5848_cast_fp16")]; + tensor var_5852_begin_0 = const()[name = tensor("op_5852_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_5852_end_0 = const()[name = tensor("op_5852_end_0"), val = tensor([2, 144, 1, 640])]; + tensor var_5852_end_mask_0 = const()[name = tensor("op_5852_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5852_cast_fp16 = slice_by_index(begin = var_5852_begin_0, end = var_5852_end_0, end_mask = var_5852_end_mask_0, x = transpose_17)[name = tensor("op_5852_cast_fp16")]; + tensor var_5856_begin_0 = const()[name = tensor("op_5856_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_5856_end_0 = const()[name = tensor("op_5856_end_0"), val = tensor([2, 144, 1, 704])]; + tensor var_5856_end_mask_0 = const()[name = tensor("op_5856_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5856_cast_fp16 = slice_by_index(begin = var_5856_begin_0, end = var_5856_end_0, end_mask = var_5856_end_mask_0, x = transpose_17)[name = tensor("op_5856_cast_fp16")]; + tensor var_5860_begin_0 = const()[name = tensor("op_5860_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_5860_end_0 = const()[name = tensor("op_5860_end_0"), val = tensor([2, 144, 1, 768])]; + tensor var_5860_end_mask_0 = const()[name = tensor("op_5860_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5860_cast_fp16 = slice_by_index(begin = var_5860_begin_0, end = var_5860_end_0, end_mask = var_5860_end_mask_0, x = transpose_17)[name = tensor("op_5860_cast_fp16")]; + tensor var_5864_begin_0 = const()[name = tensor("op_5864_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_5864_end_0 = const()[name = tensor("op_5864_end_0"), val = tensor([2, 144, 1, 832])]; + tensor var_5864_end_mask_0 = const()[name = tensor("op_5864_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5864_cast_fp16 = slice_by_index(begin = var_5864_begin_0, end = var_5864_end_0, end_mask = var_5864_end_mask_0, x = transpose_17)[name = tensor("op_5864_cast_fp16")]; + tensor var_5868_begin_0 = const()[name = tensor("op_5868_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_5868_end_0 = const()[name = tensor("op_5868_end_0"), val = tensor([2, 144, 1, 896])]; + tensor var_5868_end_mask_0 = const()[name = tensor("op_5868_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5868_cast_fp16 = slice_by_index(begin = var_5868_begin_0, end = var_5868_end_0, end_mask = var_5868_end_mask_0, x = transpose_17)[name = tensor("op_5868_cast_fp16")]; + tensor var_5872_begin_0 = const()[name = tensor("op_5872_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_5872_end_0 = const()[name = tensor("op_5872_end_0"), val = tensor([2, 144, 1, 960])]; + tensor var_5872_end_mask_0 = const()[name = tensor("op_5872_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5872_cast_fp16 = slice_by_index(begin = var_5872_begin_0, end = var_5872_end_0, end_mask = var_5872_end_mask_0, x = transpose_17)[name = tensor("op_5872_cast_fp16")]; + tensor var_5876_begin_0 = const()[name = tensor("op_5876_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_5876_end_0 = const()[name = tensor("op_5876_end_0"), val = tensor([2, 144, 1, 1024])]; + tensor var_5876_end_mask_0 = const()[name = tensor("op_5876_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5876_cast_fp16 = slice_by_index(begin = var_5876_begin_0, end = var_5876_end_0, end_mask = var_5876_end_mask_0, x = transpose_17)[name = tensor("op_5876_cast_fp16")]; + tensor var_5880_begin_0 = const()[name = tensor("op_5880_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_5880_end_0 = const()[name = tensor("op_5880_end_0"), val = tensor([2, 144, 1, 1088])]; + tensor var_5880_end_mask_0 = const()[name = tensor("op_5880_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5880_cast_fp16 = slice_by_index(begin = var_5880_begin_0, end = var_5880_end_0, end_mask = var_5880_end_mask_0, x = transpose_17)[name = tensor("op_5880_cast_fp16")]; + tensor var_5884_begin_0 = const()[name = tensor("op_5884_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_5884_end_0 = const()[name = tensor("op_5884_end_0"), val = tensor([2, 144, 1, 1152])]; + tensor var_5884_end_mask_0 = const()[name = tensor("op_5884_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5884_cast_fp16 = slice_by_index(begin = var_5884_begin_0, end = var_5884_end_0, end_mask = var_5884_end_mask_0, x = transpose_17)[name = tensor("op_5884_cast_fp16")]; + tensor var_5888_begin_0 = const()[name = tensor("op_5888_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_5888_end_0 = const()[name = tensor("op_5888_end_0"), val = tensor([2, 144, 1, 1216])]; + tensor var_5888_end_mask_0 = const()[name = tensor("op_5888_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5888_cast_fp16 = slice_by_index(begin = var_5888_begin_0, end = var_5888_end_0, end_mask = var_5888_end_mask_0, x = transpose_17)[name = tensor("op_5888_cast_fp16")]; + tensor var_5892_begin_0 = const()[name = tensor("op_5892_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_5892_end_0 = const()[name = tensor("op_5892_end_0"), val = tensor([2, 144, 1, 1280])]; + tensor var_5892_end_mask_0 = const()[name = tensor("op_5892_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_5892_cast_fp16 = slice_by_index(begin = var_5892_begin_0, end = var_5892_end_0, end_mask = var_5892_end_mask_0, x = transpose_17)[name = tensor("op_5892_cast_fp16")]; + tensor var_5894_begin_0 = const()[name = tensor("op_5894_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_5894_end_0 = const()[name = tensor("op_5894_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_5894_end_mask_0 = const()[name = tensor("op_5894_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5894_cast_fp16 = slice_by_index(begin = var_5894_begin_0, end = var_5894_end_0, end_mask = var_5894_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5894_cast_fp16")]; + tensor var_5898_begin_0 = const()[name = tensor("op_5898_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_5898_end_0 = const()[name = tensor("op_5898_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_5898_end_mask_0 = const()[name = tensor("op_5898_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5898_cast_fp16 = slice_by_index(begin = var_5898_begin_0, end = var_5898_end_0, end_mask = var_5898_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5898_cast_fp16")]; + tensor var_5902_begin_0 = const()[name = tensor("op_5902_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_5902_end_0 = const()[name = tensor("op_5902_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_5902_end_mask_0 = const()[name = tensor("op_5902_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5902_cast_fp16 = slice_by_index(begin = var_5902_begin_0, end = var_5902_end_0, end_mask = var_5902_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5902_cast_fp16")]; + tensor var_5906_begin_0 = const()[name = tensor("op_5906_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_5906_end_0 = const()[name = tensor("op_5906_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_5906_end_mask_0 = const()[name = tensor("op_5906_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5906_cast_fp16 = slice_by_index(begin = var_5906_begin_0, end = var_5906_end_0, end_mask = var_5906_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5906_cast_fp16")]; + tensor var_5910_begin_0 = const()[name = tensor("op_5910_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_5910_end_0 = const()[name = tensor("op_5910_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_5910_end_mask_0 = const()[name = tensor("op_5910_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5910_cast_fp16 = slice_by_index(begin = var_5910_begin_0, end = var_5910_end_0, end_mask = var_5910_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5910_cast_fp16")]; + tensor var_5914_begin_0 = const()[name = tensor("op_5914_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_5914_end_0 = const()[name = tensor("op_5914_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_5914_end_mask_0 = const()[name = tensor("op_5914_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5914_cast_fp16 = slice_by_index(begin = var_5914_begin_0, end = var_5914_end_0, end_mask = var_5914_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5914_cast_fp16")]; + tensor var_5918_begin_0 = const()[name = tensor("op_5918_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_5918_end_0 = const()[name = tensor("op_5918_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_5918_end_mask_0 = const()[name = tensor("op_5918_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5918_cast_fp16 = slice_by_index(begin = var_5918_begin_0, end = var_5918_end_0, end_mask = var_5918_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5918_cast_fp16")]; + tensor var_5922_begin_0 = const()[name = tensor("op_5922_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_5922_end_0 = const()[name = tensor("op_5922_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_5922_end_mask_0 = const()[name = tensor("op_5922_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5922_cast_fp16 = slice_by_index(begin = var_5922_begin_0, end = var_5922_end_0, end_mask = var_5922_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5922_cast_fp16")]; + tensor var_5926_begin_0 = const()[name = tensor("op_5926_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_5926_end_0 = const()[name = tensor("op_5926_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_5926_end_mask_0 = const()[name = tensor("op_5926_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5926_cast_fp16 = slice_by_index(begin = var_5926_begin_0, end = var_5926_end_0, end_mask = var_5926_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5926_cast_fp16")]; + tensor var_5930_begin_0 = const()[name = tensor("op_5930_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_5930_end_0 = const()[name = tensor("op_5930_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_5930_end_mask_0 = const()[name = tensor("op_5930_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5930_cast_fp16 = slice_by_index(begin = var_5930_begin_0, end = var_5930_end_0, end_mask = var_5930_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5930_cast_fp16")]; + tensor var_5934_begin_0 = const()[name = tensor("op_5934_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_5934_end_0 = const()[name = tensor("op_5934_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_5934_end_mask_0 = const()[name = tensor("op_5934_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5934_cast_fp16 = slice_by_index(begin = var_5934_begin_0, end = var_5934_end_0, end_mask = var_5934_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5934_cast_fp16")]; + tensor var_5938_begin_0 = const()[name = tensor("op_5938_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_5938_end_0 = const()[name = tensor("op_5938_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_5938_end_mask_0 = const()[name = tensor("op_5938_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5938_cast_fp16 = slice_by_index(begin = var_5938_begin_0, end = var_5938_end_0, end_mask = var_5938_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5938_cast_fp16")]; + tensor var_5942_begin_0 = const()[name = tensor("op_5942_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_5942_end_0 = const()[name = tensor("op_5942_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_5942_end_mask_0 = const()[name = tensor("op_5942_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5942_cast_fp16 = slice_by_index(begin = var_5942_begin_0, end = var_5942_end_0, end_mask = var_5942_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5942_cast_fp16")]; + tensor var_5946_begin_0 = const()[name = tensor("op_5946_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_5946_end_0 = const()[name = tensor("op_5946_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_5946_end_mask_0 = const()[name = tensor("op_5946_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5946_cast_fp16 = slice_by_index(begin = var_5946_begin_0, end = var_5946_end_0, end_mask = var_5946_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5946_cast_fp16")]; + tensor var_5950_begin_0 = const()[name = tensor("op_5950_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_5950_end_0 = const()[name = tensor("op_5950_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_5950_end_mask_0 = const()[name = tensor("op_5950_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5950_cast_fp16 = slice_by_index(begin = var_5950_begin_0, end = var_5950_end_0, end_mask = var_5950_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5950_cast_fp16")]; + tensor var_5954_begin_0 = const()[name = tensor("op_5954_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_5954_end_0 = const()[name = tensor("op_5954_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_5954_end_mask_0 = const()[name = tensor("op_5954_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5954_cast_fp16 = slice_by_index(begin = var_5954_begin_0, end = var_5954_end_0, end_mask = var_5954_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5954_cast_fp16")]; + tensor var_5958_begin_0 = const()[name = tensor("op_5958_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_5958_end_0 = const()[name = tensor("op_5958_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_5958_end_mask_0 = const()[name = tensor("op_5958_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5958_cast_fp16 = slice_by_index(begin = var_5958_begin_0, end = var_5958_end_0, end_mask = var_5958_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5958_cast_fp16")]; + tensor var_5962_begin_0 = const()[name = tensor("op_5962_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_5962_end_0 = const()[name = tensor("op_5962_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_5962_end_mask_0 = const()[name = tensor("op_5962_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5962_cast_fp16 = slice_by_index(begin = var_5962_begin_0, end = var_5962_end_0, end_mask = var_5962_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5962_cast_fp16")]; + tensor var_5966_begin_0 = const()[name = tensor("op_5966_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_5966_end_0 = const()[name = tensor("op_5966_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_5966_end_mask_0 = const()[name = tensor("op_5966_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5966_cast_fp16 = slice_by_index(begin = var_5966_begin_0, end = var_5966_end_0, end_mask = var_5966_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5966_cast_fp16")]; + tensor var_5970_begin_0 = const()[name = tensor("op_5970_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_5970_end_0 = const()[name = tensor("op_5970_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_5970_end_mask_0 = const()[name = tensor("op_5970_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_5970_cast_fp16 = slice_by_index(begin = var_5970_begin_0, end = var_5970_end_0, end_mask = var_5970_end_mask_0, x = v_29_cast_fp16)[name = tensor("op_5970_cast_fp16")]; + tensor var_5974_equation_0 = const()[name = tensor("op_5974_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5974_cast_fp16 = einsum(equation = var_5974_equation_0, values = (var_5816_cast_fp16, var_5733_cast_fp16))[name = tensor("op_5974_cast_fp16")]; + tensor var_5975_to_fp16 = const()[name = tensor("op_5975_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_361_cast_fp16 = mul(x = var_5974_cast_fp16, y = var_5975_to_fp16)[name = tensor("aw_361_cast_fp16")]; + tensor var_5978_equation_0 = const()[name = tensor("op_5978_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5978_cast_fp16 = einsum(equation = var_5978_equation_0, values = (var_5820_cast_fp16, var_5737_cast_fp16))[name = tensor("op_5978_cast_fp16")]; + tensor var_5979_to_fp16 = const()[name = tensor("op_5979_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_363_cast_fp16 = mul(x = var_5978_cast_fp16, y = var_5979_to_fp16)[name = tensor("aw_363_cast_fp16")]; + tensor var_5982_equation_0 = const()[name = tensor("op_5982_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5982_cast_fp16 = einsum(equation = var_5982_equation_0, values = (var_5824_cast_fp16, var_5741_cast_fp16))[name = tensor("op_5982_cast_fp16")]; + tensor var_5983_to_fp16 = const()[name = tensor("op_5983_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_365_cast_fp16 = mul(x = var_5982_cast_fp16, y = var_5983_to_fp16)[name = tensor("aw_365_cast_fp16")]; + tensor var_5986_equation_0 = const()[name = tensor("op_5986_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5986_cast_fp16 = einsum(equation = var_5986_equation_0, values = (var_5828_cast_fp16, var_5745_cast_fp16))[name = tensor("op_5986_cast_fp16")]; + tensor var_5987_to_fp16 = const()[name = tensor("op_5987_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_367_cast_fp16 = mul(x = var_5986_cast_fp16, y = var_5987_to_fp16)[name = tensor("aw_367_cast_fp16")]; + tensor var_5990_equation_0 = const()[name = tensor("op_5990_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5990_cast_fp16 = einsum(equation = var_5990_equation_0, values = (var_5832_cast_fp16, var_5749_cast_fp16))[name = tensor("op_5990_cast_fp16")]; + tensor var_5991_to_fp16 = const()[name = tensor("op_5991_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_369_cast_fp16 = mul(x = var_5990_cast_fp16, y = var_5991_to_fp16)[name = tensor("aw_369_cast_fp16")]; + tensor var_5994_equation_0 = const()[name = tensor("op_5994_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5994_cast_fp16 = einsum(equation = var_5994_equation_0, values = (var_5836_cast_fp16, var_5753_cast_fp16))[name = tensor("op_5994_cast_fp16")]; + tensor var_5995_to_fp16 = const()[name = tensor("op_5995_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_371_cast_fp16 = mul(x = var_5994_cast_fp16, y = var_5995_to_fp16)[name = tensor("aw_371_cast_fp16")]; + tensor var_5998_equation_0 = const()[name = tensor("op_5998_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_5998_cast_fp16 = einsum(equation = var_5998_equation_0, values = (var_5840_cast_fp16, var_5757_cast_fp16))[name = tensor("op_5998_cast_fp16")]; + tensor var_5999_to_fp16 = const()[name = tensor("op_5999_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_373_cast_fp16 = mul(x = var_5998_cast_fp16, y = var_5999_to_fp16)[name = tensor("aw_373_cast_fp16")]; + tensor var_6002_equation_0 = const()[name = tensor("op_6002_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6002_cast_fp16 = einsum(equation = var_6002_equation_0, values = (var_5844_cast_fp16, var_5761_cast_fp16))[name = tensor("op_6002_cast_fp16")]; + tensor var_6003_to_fp16 = const()[name = tensor("op_6003_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_375_cast_fp16 = mul(x = var_6002_cast_fp16, y = var_6003_to_fp16)[name = tensor("aw_375_cast_fp16")]; + tensor var_6006_equation_0 = const()[name = tensor("op_6006_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6006_cast_fp16 = einsum(equation = var_6006_equation_0, values = (var_5848_cast_fp16, var_5765_cast_fp16))[name = tensor("op_6006_cast_fp16")]; + tensor var_6007_to_fp16 = const()[name = tensor("op_6007_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_377_cast_fp16 = mul(x = var_6006_cast_fp16, y = var_6007_to_fp16)[name = tensor("aw_377_cast_fp16")]; + tensor var_6010_equation_0 = const()[name = tensor("op_6010_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6010_cast_fp16 = einsum(equation = var_6010_equation_0, values = (var_5852_cast_fp16, var_5769_cast_fp16))[name = tensor("op_6010_cast_fp16")]; + tensor var_6011_to_fp16 = const()[name = tensor("op_6011_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_379_cast_fp16 = mul(x = var_6010_cast_fp16, y = var_6011_to_fp16)[name = tensor("aw_379_cast_fp16")]; + tensor var_6014_equation_0 = const()[name = tensor("op_6014_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6014_cast_fp16 = einsum(equation = var_6014_equation_0, values = (var_5856_cast_fp16, var_5773_cast_fp16))[name = tensor("op_6014_cast_fp16")]; + tensor var_6015_to_fp16 = const()[name = tensor("op_6015_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_381_cast_fp16 = mul(x = var_6014_cast_fp16, y = var_6015_to_fp16)[name = tensor("aw_381_cast_fp16")]; + tensor var_6018_equation_0 = const()[name = tensor("op_6018_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6018_cast_fp16 = einsum(equation = var_6018_equation_0, values = (var_5860_cast_fp16, var_5777_cast_fp16))[name = tensor("op_6018_cast_fp16")]; + tensor var_6019_to_fp16 = const()[name = tensor("op_6019_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_383_cast_fp16 = mul(x = var_6018_cast_fp16, y = var_6019_to_fp16)[name = tensor("aw_383_cast_fp16")]; + tensor var_6022_equation_0 = const()[name = tensor("op_6022_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6022_cast_fp16 = einsum(equation = var_6022_equation_0, values = (var_5864_cast_fp16, var_5781_cast_fp16))[name = tensor("op_6022_cast_fp16")]; + tensor var_6023_to_fp16 = const()[name = tensor("op_6023_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_385_cast_fp16 = mul(x = var_6022_cast_fp16, y = var_6023_to_fp16)[name = tensor("aw_385_cast_fp16")]; + tensor var_6026_equation_0 = const()[name = tensor("op_6026_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6026_cast_fp16 = einsum(equation = var_6026_equation_0, values = (var_5868_cast_fp16, var_5785_cast_fp16))[name = tensor("op_6026_cast_fp16")]; + tensor var_6027_to_fp16 = const()[name = tensor("op_6027_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_387_cast_fp16 = mul(x = var_6026_cast_fp16, y = var_6027_to_fp16)[name = tensor("aw_387_cast_fp16")]; + tensor var_6030_equation_0 = const()[name = tensor("op_6030_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6030_cast_fp16 = einsum(equation = var_6030_equation_0, values = (var_5872_cast_fp16, var_5789_cast_fp16))[name = tensor("op_6030_cast_fp16")]; + tensor var_6031_to_fp16 = const()[name = tensor("op_6031_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_389_cast_fp16 = mul(x = var_6030_cast_fp16, y = var_6031_to_fp16)[name = tensor("aw_389_cast_fp16")]; + tensor var_6034_equation_0 = const()[name = tensor("op_6034_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6034_cast_fp16 = einsum(equation = var_6034_equation_0, values = (var_5876_cast_fp16, var_5793_cast_fp16))[name = tensor("op_6034_cast_fp16")]; + tensor var_6035_to_fp16 = const()[name = tensor("op_6035_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_391_cast_fp16 = mul(x = var_6034_cast_fp16, y = var_6035_to_fp16)[name = tensor("aw_391_cast_fp16")]; + tensor var_6038_equation_0 = const()[name = tensor("op_6038_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6038_cast_fp16 = einsum(equation = var_6038_equation_0, values = (var_5880_cast_fp16, var_5797_cast_fp16))[name = tensor("op_6038_cast_fp16")]; + tensor var_6039_to_fp16 = const()[name = tensor("op_6039_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_393_cast_fp16 = mul(x = var_6038_cast_fp16, y = var_6039_to_fp16)[name = tensor("aw_393_cast_fp16")]; + tensor var_6042_equation_0 = const()[name = tensor("op_6042_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6042_cast_fp16 = einsum(equation = var_6042_equation_0, values = (var_5884_cast_fp16, var_5801_cast_fp16))[name = tensor("op_6042_cast_fp16")]; + tensor var_6043_to_fp16 = const()[name = tensor("op_6043_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_395_cast_fp16 = mul(x = var_6042_cast_fp16, y = var_6043_to_fp16)[name = tensor("aw_395_cast_fp16")]; + tensor var_6046_equation_0 = const()[name = tensor("op_6046_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6046_cast_fp16 = einsum(equation = var_6046_equation_0, values = (var_5888_cast_fp16, var_5805_cast_fp16))[name = tensor("op_6046_cast_fp16")]; + tensor var_6047_to_fp16 = const()[name = tensor("op_6047_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_397_cast_fp16 = mul(x = var_6046_cast_fp16, y = var_6047_to_fp16)[name = tensor("aw_397_cast_fp16")]; + tensor var_6050_equation_0 = const()[name = tensor("op_6050_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6050_cast_fp16 = einsum(equation = var_6050_equation_0, values = (var_5892_cast_fp16, var_5809_cast_fp16))[name = tensor("op_6050_cast_fp16")]; + tensor var_6051_to_fp16 = const()[name = tensor("op_6051_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_399_cast_fp16 = mul(x = var_6050_cast_fp16, y = var_6051_to_fp16)[name = tensor("aw_399_cast_fp16")]; + tensor var_6053_cast_fp16 = softmax(axis = var_5599, x = aw_361_cast_fp16)[name = tensor("op_6053_cast_fp16")]; + tensor var_6054_cast_fp16 = softmax(axis = var_5599, x = aw_363_cast_fp16)[name = tensor("op_6054_cast_fp16")]; + tensor var_6055_cast_fp16 = softmax(axis = var_5599, x = aw_365_cast_fp16)[name = tensor("op_6055_cast_fp16")]; + tensor var_6056_cast_fp16 = softmax(axis = var_5599, x = aw_367_cast_fp16)[name = tensor("op_6056_cast_fp16")]; + tensor var_6057_cast_fp16 = softmax(axis = var_5599, x = aw_369_cast_fp16)[name = tensor("op_6057_cast_fp16")]; + tensor var_6058_cast_fp16 = softmax(axis = var_5599, x = aw_371_cast_fp16)[name = tensor("op_6058_cast_fp16")]; + tensor var_6059_cast_fp16 = softmax(axis = var_5599, x = aw_373_cast_fp16)[name = tensor("op_6059_cast_fp16")]; + tensor var_6060_cast_fp16 = softmax(axis = var_5599, x = aw_375_cast_fp16)[name = tensor("op_6060_cast_fp16")]; + tensor var_6061_cast_fp16 = softmax(axis = var_5599, x = aw_377_cast_fp16)[name = tensor("op_6061_cast_fp16")]; + tensor var_6062_cast_fp16 = softmax(axis = var_5599, x = aw_379_cast_fp16)[name = tensor("op_6062_cast_fp16")]; + tensor var_6063_cast_fp16 = softmax(axis = var_5599, x = aw_381_cast_fp16)[name = tensor("op_6063_cast_fp16")]; + tensor var_6064_cast_fp16 = softmax(axis = var_5599, x = aw_383_cast_fp16)[name = tensor("op_6064_cast_fp16")]; + tensor var_6065_cast_fp16 = softmax(axis = var_5599, x = aw_385_cast_fp16)[name = tensor("op_6065_cast_fp16")]; + tensor var_6066_cast_fp16 = softmax(axis = var_5599, x = aw_387_cast_fp16)[name = tensor("op_6066_cast_fp16")]; + tensor var_6067_cast_fp16 = softmax(axis = var_5599, x = aw_389_cast_fp16)[name = tensor("op_6067_cast_fp16")]; + tensor var_6068_cast_fp16 = softmax(axis = var_5599, x = aw_391_cast_fp16)[name = tensor("op_6068_cast_fp16")]; + tensor var_6069_cast_fp16 = softmax(axis = var_5599, x = aw_393_cast_fp16)[name = tensor("op_6069_cast_fp16")]; + tensor var_6070_cast_fp16 = softmax(axis = var_5599, x = aw_395_cast_fp16)[name = tensor("op_6070_cast_fp16")]; + tensor var_6071_cast_fp16 = softmax(axis = var_5599, x = aw_397_cast_fp16)[name = tensor("op_6071_cast_fp16")]; + tensor var_6072_cast_fp16 = softmax(axis = var_5599, x = aw_399_cast_fp16)[name = tensor("op_6072_cast_fp16")]; + tensor var_6074_equation_0 = const()[name = tensor("op_6074_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6074_cast_fp16 = einsum(equation = var_6074_equation_0, values = (var_5894_cast_fp16, var_6053_cast_fp16))[name = tensor("op_6074_cast_fp16")]; + tensor var_6076_equation_0 = const()[name = tensor("op_6076_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6076_cast_fp16 = einsum(equation = var_6076_equation_0, values = (var_5898_cast_fp16, var_6054_cast_fp16))[name = tensor("op_6076_cast_fp16")]; + tensor var_6078_equation_0 = const()[name = tensor("op_6078_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6078_cast_fp16 = einsum(equation = var_6078_equation_0, values = (var_5902_cast_fp16, var_6055_cast_fp16))[name = tensor("op_6078_cast_fp16")]; + tensor var_6080_equation_0 = const()[name = tensor("op_6080_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6080_cast_fp16 = einsum(equation = var_6080_equation_0, values = (var_5906_cast_fp16, var_6056_cast_fp16))[name = tensor("op_6080_cast_fp16")]; + tensor var_6082_equation_0 = const()[name = tensor("op_6082_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6082_cast_fp16 = einsum(equation = var_6082_equation_0, values = (var_5910_cast_fp16, var_6057_cast_fp16))[name = tensor("op_6082_cast_fp16")]; + tensor var_6084_equation_0 = const()[name = tensor("op_6084_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6084_cast_fp16 = einsum(equation = var_6084_equation_0, values = (var_5914_cast_fp16, var_6058_cast_fp16))[name = tensor("op_6084_cast_fp16")]; + tensor var_6086_equation_0 = const()[name = tensor("op_6086_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6086_cast_fp16 = einsum(equation = var_6086_equation_0, values = (var_5918_cast_fp16, var_6059_cast_fp16))[name = tensor("op_6086_cast_fp16")]; + tensor var_6088_equation_0 = const()[name = tensor("op_6088_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6088_cast_fp16 = einsum(equation = var_6088_equation_0, values = (var_5922_cast_fp16, var_6060_cast_fp16))[name = tensor("op_6088_cast_fp16")]; + tensor var_6090_equation_0 = const()[name = tensor("op_6090_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6090_cast_fp16 = einsum(equation = var_6090_equation_0, values = (var_5926_cast_fp16, var_6061_cast_fp16))[name = tensor("op_6090_cast_fp16")]; + tensor var_6092_equation_0 = const()[name = tensor("op_6092_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6092_cast_fp16 = einsum(equation = var_6092_equation_0, values = (var_5930_cast_fp16, var_6062_cast_fp16))[name = tensor("op_6092_cast_fp16")]; + tensor var_6094_equation_0 = const()[name = tensor("op_6094_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6094_cast_fp16 = einsum(equation = var_6094_equation_0, values = (var_5934_cast_fp16, var_6063_cast_fp16))[name = tensor("op_6094_cast_fp16")]; + tensor var_6096_equation_0 = const()[name = tensor("op_6096_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6096_cast_fp16 = einsum(equation = var_6096_equation_0, values = (var_5938_cast_fp16, var_6064_cast_fp16))[name = tensor("op_6096_cast_fp16")]; + tensor var_6098_equation_0 = const()[name = tensor("op_6098_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6098_cast_fp16 = einsum(equation = var_6098_equation_0, values = (var_5942_cast_fp16, var_6065_cast_fp16))[name = tensor("op_6098_cast_fp16")]; + tensor var_6100_equation_0 = const()[name = tensor("op_6100_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6100_cast_fp16 = einsum(equation = var_6100_equation_0, values = (var_5946_cast_fp16, var_6066_cast_fp16))[name = tensor("op_6100_cast_fp16")]; + tensor var_6102_equation_0 = const()[name = tensor("op_6102_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6102_cast_fp16 = einsum(equation = var_6102_equation_0, values = (var_5950_cast_fp16, var_6067_cast_fp16))[name = tensor("op_6102_cast_fp16")]; + tensor var_6104_equation_0 = const()[name = tensor("op_6104_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6104_cast_fp16 = einsum(equation = var_6104_equation_0, values = (var_5954_cast_fp16, var_6068_cast_fp16))[name = tensor("op_6104_cast_fp16")]; + tensor var_6106_equation_0 = const()[name = tensor("op_6106_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6106_cast_fp16 = einsum(equation = var_6106_equation_0, values = (var_5958_cast_fp16, var_6069_cast_fp16))[name = tensor("op_6106_cast_fp16")]; + tensor var_6108_equation_0 = const()[name = tensor("op_6108_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6108_cast_fp16 = einsum(equation = var_6108_equation_0, values = (var_5962_cast_fp16, var_6070_cast_fp16))[name = tensor("op_6108_cast_fp16")]; + tensor var_6110_equation_0 = const()[name = tensor("op_6110_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6110_cast_fp16 = einsum(equation = var_6110_equation_0, values = (var_5966_cast_fp16, var_6071_cast_fp16))[name = tensor("op_6110_cast_fp16")]; + tensor var_6112_equation_0 = const()[name = tensor("op_6112_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6112_cast_fp16 = einsum(equation = var_6112_equation_0, values = (var_5970_cast_fp16, var_6072_cast_fp16))[name = tensor("op_6112_cast_fp16")]; + tensor input_301_interleave_0 = const()[name = tensor("input_301_interleave_0"), val = tensor(false)]; + tensor input_301_cast_fp16 = concat(axis = var_5599, interleave = input_301_interleave_0, values = (var_6074_cast_fp16, var_6076_cast_fp16, var_6078_cast_fp16, var_6080_cast_fp16, var_6082_cast_fp16, var_6084_cast_fp16, var_6086_cast_fp16, var_6088_cast_fp16, var_6090_cast_fp16, var_6092_cast_fp16, var_6094_cast_fp16, var_6096_cast_fp16, var_6098_cast_fp16, var_6100_cast_fp16, var_6102_cast_fp16, var_6104_cast_fp16, var_6106_cast_fp16, var_6108_cast_fp16, var_6110_cast_fp16, var_6112_cast_fp16))[name = tensor("input_301_cast_fp16")]; + tensor var_6118 = const()[name = tensor("op_6118"), val = tensor([1, 1])]; + tensor var_6120 = const()[name = tensor("op_6120"), val = tensor([1, 1])]; + tensor var_6122_pad_type_0 = const()[name = tensor("op_6122_pad_type_0"), val = tensor("custom")]; + tensor var_6122_pad_0 = const()[name = tensor("op_6122_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1139299328)))]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1142576192)))]; + tensor var_6122_cast_fp16 = conv(bias = up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_6120, groups = var_5599, pad = var_6122_pad_0, pad_type = var_6122_pad_type_0, strides = var_6118, weight = up_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_301_cast_fp16)[name = tensor("op_6122_cast_fp16")]; + tensor inputs_45_cast_fp16 = add(x = var_6122_cast_fp16, y = inputs_43_cast_fp16)[name = tensor("inputs_45_cast_fp16")]; + tensor var_6126 = const()[name = tensor("op_6126"), val = tensor([1])]; + tensor channels_mean_45_cast_fp16 = reduce_mean(axes = var_6126, keep_dims = var_5594, x = inputs_45_cast_fp16)[name = tensor("channels_mean_45_cast_fp16")]; + tensor zero_mean_45_cast_fp16 = sub(x = inputs_45_cast_fp16, y = channels_mean_45_cast_fp16)[name = tensor("zero_mean_45_cast_fp16")]; + tensor zero_mean_sq_45_cast_fp16 = mul(x = zero_mean_45_cast_fp16, y = zero_mean_45_cast_fp16)[name = tensor("zero_mean_sq_45_cast_fp16")]; + tensor var_6130 = const()[name = tensor("op_6130"), val = tensor([1])]; + tensor var_6131_cast_fp16 = reduce_mean(axes = var_6130, keep_dims = var_5594, x = zero_mean_sq_45_cast_fp16)[name = tensor("op_6131_cast_fp16")]; + tensor var_6132_to_fp16 = const()[name = tensor("op_6132_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_6133_cast_fp16 = add(x = var_6131_cast_fp16, y = var_6132_to_fp16)[name = tensor("op_6133_cast_fp16")]; + tensor denom_45_epsilon_0_to_fp16 = const()[name = tensor("denom_45_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_45_cast_fp16 = rsqrt(epsilon = denom_45_epsilon_0_to_fp16, x = var_6133_cast_fp16)[name = tensor("denom_45_cast_fp16")]; + tensor out_45_cast_fp16 = mul(x = zero_mean_45_cast_fp16, y = denom_45_cast_fp16)[name = tensor("out_45_cast_fp16")]; + tensor var_6137_to_fp16 = const()[name = tensor("op_6137_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1142578816)))]; + tensor var_6138_cast_fp16 = add(x = out_45_cast_fp16, y = var_6137_to_fp16)[name = tensor("op_6138_cast_fp16")]; + tensor var_6140_to_fp16 = const()[name = tensor("op_6140_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1142581440)))]; + tensor hidden_states_169_cast_fp16 = mul(x = var_6138_cast_fp16, y = var_6140_to_fp16)[name = tensor("hidden_states_169_cast_fp16")]; + tensor var_6147 = const()[name = tensor("op_6147"), val = tensor([1, 1])]; + tensor var_6149 = const()[name = tensor("op_6149"), val = tensor([1, 1])]; + tensor q_31_pad_type_0 = const()[name = tensor("q_31_pad_type_0"), val = tensor("custom")]; + tensor q_31_pad_0 = const()[name = tensor("q_31_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1142584064)))]; + tensor q_31_cast_fp16 = conv(dilations = var_6149, groups = var_5599, pad = q_31_pad_0, pad_type = q_31_pad_type_0, strides = var_6147, weight = up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_169_cast_fp16)[name = tensor("q_31_cast_fp16")]; + tensor var_6153 = const()[name = tensor("op_6153"), val = tensor([1, 1])]; + tensor var_6155 = const()[name = tensor("op_6155"), val = tensor([1, 1])]; + tensor k_61_pad_type_0 = const()[name = tensor("k_61_pad_type_0"), val = tensor("custom")]; + tensor k_61_pad_0 = const()[name = tensor("k_61_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1145860928)))]; + tensor k_61_cast_fp16 = conv(dilations = var_6155, groups = var_5599, pad = k_61_pad_0, pad_type = k_61_pad_type_0, strides = var_6153, weight = up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_61_cast_fp16")]; + tensor var_6159 = const()[name = tensor("op_6159"), val = tensor([1, 1])]; + tensor var_6161 = const()[name = tensor("op_6161"), val = tensor([1, 1])]; + tensor v_31_pad_type_0 = const()[name = tensor("v_31_pad_type_0"), val = tensor("custom")]; + tensor v_31_pad_0 = const()[name = tensor("v_31_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1148482432)))]; + tensor v_31_cast_fp16 = conv(dilations = var_6161, groups = var_5599, pad = v_31_pad_0, pad_type = v_31_pad_type_0, strides = var_6159, weight = up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_31_cast_fp16")]; + tensor var_6165_begin_0 = const()[name = tensor("op_6165_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_6165_end_0 = const()[name = tensor("op_6165_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_6165_end_mask_0 = const()[name = tensor("op_6165_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6165_cast_fp16 = slice_by_index(begin = var_6165_begin_0, end = var_6165_end_0, end_mask = var_6165_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6165_cast_fp16")]; + tensor var_6169_begin_0 = const()[name = tensor("op_6169_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_6169_end_0 = const()[name = tensor("op_6169_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_6169_end_mask_0 = const()[name = tensor("op_6169_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6169_cast_fp16 = slice_by_index(begin = var_6169_begin_0, end = var_6169_end_0, end_mask = var_6169_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6169_cast_fp16")]; + tensor var_6173_begin_0 = const()[name = tensor("op_6173_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_6173_end_0 = const()[name = tensor("op_6173_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_6173_end_mask_0 = const()[name = tensor("op_6173_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6173_cast_fp16 = slice_by_index(begin = var_6173_begin_0, end = var_6173_end_0, end_mask = var_6173_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6173_cast_fp16")]; + tensor var_6177_begin_0 = const()[name = tensor("op_6177_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_6177_end_0 = const()[name = tensor("op_6177_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_6177_end_mask_0 = const()[name = tensor("op_6177_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6177_cast_fp16 = slice_by_index(begin = var_6177_begin_0, end = var_6177_end_0, end_mask = var_6177_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6177_cast_fp16")]; + tensor var_6181_begin_0 = const()[name = tensor("op_6181_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_6181_end_0 = const()[name = tensor("op_6181_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_6181_end_mask_0 = const()[name = tensor("op_6181_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6181_cast_fp16 = slice_by_index(begin = var_6181_begin_0, end = var_6181_end_0, end_mask = var_6181_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6181_cast_fp16")]; + tensor var_6185_begin_0 = const()[name = tensor("op_6185_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_6185_end_0 = const()[name = tensor("op_6185_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_6185_end_mask_0 = const()[name = tensor("op_6185_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6185_cast_fp16 = slice_by_index(begin = var_6185_begin_0, end = var_6185_end_0, end_mask = var_6185_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6185_cast_fp16")]; + tensor var_6189_begin_0 = const()[name = tensor("op_6189_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_6189_end_0 = const()[name = tensor("op_6189_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_6189_end_mask_0 = const()[name = tensor("op_6189_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6189_cast_fp16 = slice_by_index(begin = var_6189_begin_0, end = var_6189_end_0, end_mask = var_6189_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6189_cast_fp16")]; + tensor var_6193_begin_0 = const()[name = tensor("op_6193_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_6193_end_0 = const()[name = tensor("op_6193_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_6193_end_mask_0 = const()[name = tensor("op_6193_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6193_cast_fp16 = slice_by_index(begin = var_6193_begin_0, end = var_6193_end_0, end_mask = var_6193_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6193_cast_fp16")]; + tensor var_6197_begin_0 = const()[name = tensor("op_6197_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_6197_end_0 = const()[name = tensor("op_6197_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_6197_end_mask_0 = const()[name = tensor("op_6197_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6197_cast_fp16 = slice_by_index(begin = var_6197_begin_0, end = var_6197_end_0, end_mask = var_6197_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6197_cast_fp16")]; + tensor var_6201_begin_0 = const()[name = tensor("op_6201_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_6201_end_0 = const()[name = tensor("op_6201_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_6201_end_mask_0 = const()[name = tensor("op_6201_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6201_cast_fp16 = slice_by_index(begin = var_6201_begin_0, end = var_6201_end_0, end_mask = var_6201_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6201_cast_fp16")]; + tensor var_6205_begin_0 = const()[name = tensor("op_6205_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_6205_end_0 = const()[name = tensor("op_6205_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_6205_end_mask_0 = const()[name = tensor("op_6205_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6205_cast_fp16 = slice_by_index(begin = var_6205_begin_0, end = var_6205_end_0, end_mask = var_6205_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6205_cast_fp16")]; + tensor var_6209_begin_0 = const()[name = tensor("op_6209_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_6209_end_0 = const()[name = tensor("op_6209_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_6209_end_mask_0 = const()[name = tensor("op_6209_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6209_cast_fp16 = slice_by_index(begin = var_6209_begin_0, end = var_6209_end_0, end_mask = var_6209_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6209_cast_fp16")]; + tensor var_6213_begin_0 = const()[name = tensor("op_6213_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_6213_end_0 = const()[name = tensor("op_6213_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_6213_end_mask_0 = const()[name = tensor("op_6213_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6213_cast_fp16 = slice_by_index(begin = var_6213_begin_0, end = var_6213_end_0, end_mask = var_6213_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6213_cast_fp16")]; + tensor var_6217_begin_0 = const()[name = tensor("op_6217_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_6217_end_0 = const()[name = tensor("op_6217_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_6217_end_mask_0 = const()[name = tensor("op_6217_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6217_cast_fp16 = slice_by_index(begin = var_6217_begin_0, end = var_6217_end_0, end_mask = var_6217_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6217_cast_fp16")]; + tensor var_6221_begin_0 = const()[name = tensor("op_6221_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_6221_end_0 = const()[name = tensor("op_6221_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_6221_end_mask_0 = const()[name = tensor("op_6221_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6221_cast_fp16 = slice_by_index(begin = var_6221_begin_0, end = var_6221_end_0, end_mask = var_6221_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6221_cast_fp16")]; + tensor var_6225_begin_0 = const()[name = tensor("op_6225_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_6225_end_0 = const()[name = tensor("op_6225_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_6225_end_mask_0 = const()[name = tensor("op_6225_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6225_cast_fp16 = slice_by_index(begin = var_6225_begin_0, end = var_6225_end_0, end_mask = var_6225_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6225_cast_fp16")]; + tensor var_6229_begin_0 = const()[name = tensor("op_6229_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_6229_end_0 = const()[name = tensor("op_6229_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_6229_end_mask_0 = const()[name = tensor("op_6229_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6229_cast_fp16 = slice_by_index(begin = var_6229_begin_0, end = var_6229_end_0, end_mask = var_6229_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6229_cast_fp16")]; + tensor var_6233_begin_0 = const()[name = tensor("op_6233_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_6233_end_0 = const()[name = tensor("op_6233_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_6233_end_mask_0 = const()[name = tensor("op_6233_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6233_cast_fp16 = slice_by_index(begin = var_6233_begin_0, end = var_6233_end_0, end_mask = var_6233_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6233_cast_fp16")]; + tensor var_6237_begin_0 = const()[name = tensor("op_6237_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_6237_end_0 = const()[name = tensor("op_6237_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_6237_end_mask_0 = const()[name = tensor("op_6237_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6237_cast_fp16 = slice_by_index(begin = var_6237_begin_0, end = var_6237_end_0, end_mask = var_6237_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6237_cast_fp16")]; + tensor var_6241_begin_0 = const()[name = tensor("op_6241_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_6241_end_0 = const()[name = tensor("op_6241_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_6241_end_mask_0 = const()[name = tensor("op_6241_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6241_cast_fp16 = slice_by_index(begin = var_6241_begin_0, end = var_6241_end_0, end_mask = var_6241_end_mask_0, x = q_31_cast_fp16)[name = tensor("op_6241_cast_fp16")]; + tensor k_63_perm_0 = const()[name = tensor("k_63_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_6248_begin_0 = const()[name = tensor("op_6248_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_6248_end_0 = const()[name = tensor("op_6248_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_6248_end_mask_0 = const()[name = tensor("op_6248_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_16 = transpose(perm = k_63_perm_0, x = k_61_cast_fp16)[name = tensor("transpose_16")]; + tensor var_6248_cast_fp16 = slice_by_index(begin = var_6248_begin_0, end = var_6248_end_0, end_mask = var_6248_end_mask_0, x = transpose_16)[name = tensor("op_6248_cast_fp16")]; + tensor var_6252_begin_0 = const()[name = tensor("op_6252_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_6252_end_0 = const()[name = tensor("op_6252_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_6252_end_mask_0 = const()[name = tensor("op_6252_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6252_cast_fp16 = slice_by_index(begin = var_6252_begin_0, end = var_6252_end_0, end_mask = var_6252_end_mask_0, x = transpose_16)[name = tensor("op_6252_cast_fp16")]; + tensor var_6256_begin_0 = const()[name = tensor("op_6256_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_6256_end_0 = const()[name = tensor("op_6256_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_6256_end_mask_0 = const()[name = tensor("op_6256_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6256_cast_fp16 = slice_by_index(begin = var_6256_begin_0, end = var_6256_end_0, end_mask = var_6256_end_mask_0, x = transpose_16)[name = tensor("op_6256_cast_fp16")]; + tensor var_6260_begin_0 = const()[name = tensor("op_6260_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_6260_end_0 = const()[name = tensor("op_6260_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_6260_end_mask_0 = const()[name = tensor("op_6260_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6260_cast_fp16 = slice_by_index(begin = var_6260_begin_0, end = var_6260_end_0, end_mask = var_6260_end_mask_0, x = transpose_16)[name = tensor("op_6260_cast_fp16")]; + tensor var_6264_begin_0 = const()[name = tensor("op_6264_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_6264_end_0 = const()[name = tensor("op_6264_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_6264_end_mask_0 = const()[name = tensor("op_6264_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6264_cast_fp16 = slice_by_index(begin = var_6264_begin_0, end = var_6264_end_0, end_mask = var_6264_end_mask_0, x = transpose_16)[name = tensor("op_6264_cast_fp16")]; + tensor var_6268_begin_0 = const()[name = tensor("op_6268_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_6268_end_0 = const()[name = tensor("op_6268_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_6268_end_mask_0 = const()[name = tensor("op_6268_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6268_cast_fp16 = slice_by_index(begin = var_6268_begin_0, end = var_6268_end_0, end_mask = var_6268_end_mask_0, x = transpose_16)[name = tensor("op_6268_cast_fp16")]; + tensor var_6272_begin_0 = const()[name = tensor("op_6272_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_6272_end_0 = const()[name = tensor("op_6272_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_6272_end_mask_0 = const()[name = tensor("op_6272_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6272_cast_fp16 = slice_by_index(begin = var_6272_begin_0, end = var_6272_end_0, end_mask = var_6272_end_mask_0, x = transpose_16)[name = tensor("op_6272_cast_fp16")]; + tensor var_6276_begin_0 = const()[name = tensor("op_6276_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_6276_end_0 = const()[name = tensor("op_6276_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_6276_end_mask_0 = const()[name = tensor("op_6276_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6276_cast_fp16 = slice_by_index(begin = var_6276_begin_0, end = var_6276_end_0, end_mask = var_6276_end_mask_0, x = transpose_16)[name = tensor("op_6276_cast_fp16")]; + tensor var_6280_begin_0 = const()[name = tensor("op_6280_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_6280_end_0 = const()[name = tensor("op_6280_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_6280_end_mask_0 = const()[name = tensor("op_6280_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6280_cast_fp16 = slice_by_index(begin = var_6280_begin_0, end = var_6280_end_0, end_mask = var_6280_end_mask_0, x = transpose_16)[name = tensor("op_6280_cast_fp16")]; + tensor var_6284_begin_0 = const()[name = tensor("op_6284_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_6284_end_0 = const()[name = tensor("op_6284_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_6284_end_mask_0 = const()[name = tensor("op_6284_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6284_cast_fp16 = slice_by_index(begin = var_6284_begin_0, end = var_6284_end_0, end_mask = var_6284_end_mask_0, x = transpose_16)[name = tensor("op_6284_cast_fp16")]; + tensor var_6288_begin_0 = const()[name = tensor("op_6288_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_6288_end_0 = const()[name = tensor("op_6288_end_0"), val = tensor([2, 77, 1, 704])]; + tensor var_6288_end_mask_0 = const()[name = tensor("op_6288_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6288_cast_fp16 = slice_by_index(begin = var_6288_begin_0, end = var_6288_end_0, end_mask = var_6288_end_mask_0, x = transpose_16)[name = tensor("op_6288_cast_fp16")]; + tensor var_6292_begin_0 = const()[name = tensor("op_6292_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_6292_end_0 = const()[name = tensor("op_6292_end_0"), val = tensor([2, 77, 1, 768])]; + tensor var_6292_end_mask_0 = const()[name = tensor("op_6292_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6292_cast_fp16 = slice_by_index(begin = var_6292_begin_0, end = var_6292_end_0, end_mask = var_6292_end_mask_0, x = transpose_16)[name = tensor("op_6292_cast_fp16")]; + tensor var_6296_begin_0 = const()[name = tensor("op_6296_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_6296_end_0 = const()[name = tensor("op_6296_end_0"), val = tensor([2, 77, 1, 832])]; + tensor var_6296_end_mask_0 = const()[name = tensor("op_6296_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6296_cast_fp16 = slice_by_index(begin = var_6296_begin_0, end = var_6296_end_0, end_mask = var_6296_end_mask_0, x = transpose_16)[name = tensor("op_6296_cast_fp16")]; + tensor var_6300_begin_0 = const()[name = tensor("op_6300_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_6300_end_0 = const()[name = tensor("op_6300_end_0"), val = tensor([2, 77, 1, 896])]; + tensor var_6300_end_mask_0 = const()[name = tensor("op_6300_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6300_cast_fp16 = slice_by_index(begin = var_6300_begin_0, end = var_6300_end_0, end_mask = var_6300_end_mask_0, x = transpose_16)[name = tensor("op_6300_cast_fp16")]; + tensor var_6304_begin_0 = const()[name = tensor("op_6304_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_6304_end_0 = const()[name = tensor("op_6304_end_0"), val = tensor([2, 77, 1, 960])]; + tensor var_6304_end_mask_0 = const()[name = tensor("op_6304_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6304_cast_fp16 = slice_by_index(begin = var_6304_begin_0, end = var_6304_end_0, end_mask = var_6304_end_mask_0, x = transpose_16)[name = tensor("op_6304_cast_fp16")]; + tensor var_6308_begin_0 = const()[name = tensor("op_6308_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_6308_end_0 = const()[name = tensor("op_6308_end_0"), val = tensor([2, 77, 1, 1024])]; + tensor var_6308_end_mask_0 = const()[name = tensor("op_6308_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6308_cast_fp16 = slice_by_index(begin = var_6308_begin_0, end = var_6308_end_0, end_mask = var_6308_end_mask_0, x = transpose_16)[name = tensor("op_6308_cast_fp16")]; + tensor var_6312_begin_0 = const()[name = tensor("op_6312_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_6312_end_0 = const()[name = tensor("op_6312_end_0"), val = tensor([2, 77, 1, 1088])]; + tensor var_6312_end_mask_0 = const()[name = tensor("op_6312_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6312_cast_fp16 = slice_by_index(begin = var_6312_begin_0, end = var_6312_end_0, end_mask = var_6312_end_mask_0, x = transpose_16)[name = tensor("op_6312_cast_fp16")]; + tensor var_6316_begin_0 = const()[name = tensor("op_6316_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_6316_end_0 = const()[name = tensor("op_6316_end_0"), val = tensor([2, 77, 1, 1152])]; + tensor var_6316_end_mask_0 = const()[name = tensor("op_6316_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6316_cast_fp16 = slice_by_index(begin = var_6316_begin_0, end = var_6316_end_0, end_mask = var_6316_end_mask_0, x = transpose_16)[name = tensor("op_6316_cast_fp16")]; + tensor var_6320_begin_0 = const()[name = tensor("op_6320_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_6320_end_0 = const()[name = tensor("op_6320_end_0"), val = tensor([2, 77, 1, 1216])]; + tensor var_6320_end_mask_0 = const()[name = tensor("op_6320_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6320_cast_fp16 = slice_by_index(begin = var_6320_begin_0, end = var_6320_end_0, end_mask = var_6320_end_mask_0, x = transpose_16)[name = tensor("op_6320_cast_fp16")]; + tensor var_6324_begin_0 = const()[name = tensor("op_6324_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_6324_end_0 = const()[name = tensor("op_6324_end_0"), val = tensor([2, 77, 1, 1280])]; + tensor var_6324_end_mask_0 = const()[name = tensor("op_6324_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6324_cast_fp16 = slice_by_index(begin = var_6324_begin_0, end = var_6324_end_0, end_mask = var_6324_end_mask_0, x = transpose_16)[name = tensor("op_6324_cast_fp16")]; + tensor var_6326_begin_0 = const()[name = tensor("op_6326_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_6326_end_0 = const()[name = tensor("op_6326_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_6326_end_mask_0 = const()[name = tensor("op_6326_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6326_cast_fp16 = slice_by_index(begin = var_6326_begin_0, end = var_6326_end_0, end_mask = var_6326_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6326_cast_fp16")]; + tensor var_6330_begin_0 = const()[name = tensor("op_6330_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_6330_end_0 = const()[name = tensor("op_6330_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_6330_end_mask_0 = const()[name = tensor("op_6330_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6330_cast_fp16 = slice_by_index(begin = var_6330_begin_0, end = var_6330_end_0, end_mask = var_6330_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6330_cast_fp16")]; + tensor var_6334_begin_0 = const()[name = tensor("op_6334_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_6334_end_0 = const()[name = tensor("op_6334_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_6334_end_mask_0 = const()[name = tensor("op_6334_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6334_cast_fp16 = slice_by_index(begin = var_6334_begin_0, end = var_6334_end_0, end_mask = var_6334_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6334_cast_fp16")]; + tensor var_6338_begin_0 = const()[name = tensor("op_6338_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_6338_end_0 = const()[name = tensor("op_6338_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_6338_end_mask_0 = const()[name = tensor("op_6338_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6338_cast_fp16 = slice_by_index(begin = var_6338_begin_0, end = var_6338_end_0, end_mask = var_6338_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6338_cast_fp16")]; + tensor var_6342_begin_0 = const()[name = tensor("op_6342_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_6342_end_0 = const()[name = tensor("op_6342_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_6342_end_mask_0 = const()[name = tensor("op_6342_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6342_cast_fp16 = slice_by_index(begin = var_6342_begin_0, end = var_6342_end_0, end_mask = var_6342_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6342_cast_fp16")]; + tensor var_6346_begin_0 = const()[name = tensor("op_6346_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_6346_end_0 = const()[name = tensor("op_6346_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_6346_end_mask_0 = const()[name = tensor("op_6346_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6346_cast_fp16 = slice_by_index(begin = var_6346_begin_0, end = var_6346_end_0, end_mask = var_6346_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6346_cast_fp16")]; + tensor var_6350_begin_0 = const()[name = tensor("op_6350_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_6350_end_0 = const()[name = tensor("op_6350_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_6350_end_mask_0 = const()[name = tensor("op_6350_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6350_cast_fp16 = slice_by_index(begin = var_6350_begin_0, end = var_6350_end_0, end_mask = var_6350_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6350_cast_fp16")]; + tensor var_6354_begin_0 = const()[name = tensor("op_6354_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_6354_end_0 = const()[name = tensor("op_6354_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_6354_end_mask_0 = const()[name = tensor("op_6354_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6354_cast_fp16 = slice_by_index(begin = var_6354_begin_0, end = var_6354_end_0, end_mask = var_6354_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6354_cast_fp16")]; + tensor var_6358_begin_0 = const()[name = tensor("op_6358_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_6358_end_0 = const()[name = tensor("op_6358_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_6358_end_mask_0 = const()[name = tensor("op_6358_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6358_cast_fp16 = slice_by_index(begin = var_6358_begin_0, end = var_6358_end_0, end_mask = var_6358_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6358_cast_fp16")]; + tensor var_6362_begin_0 = const()[name = tensor("op_6362_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_6362_end_0 = const()[name = tensor("op_6362_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_6362_end_mask_0 = const()[name = tensor("op_6362_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6362_cast_fp16 = slice_by_index(begin = var_6362_begin_0, end = var_6362_end_0, end_mask = var_6362_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6362_cast_fp16")]; + tensor var_6366_begin_0 = const()[name = tensor("op_6366_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_6366_end_0 = const()[name = tensor("op_6366_end_0"), val = tensor([2, 704, 1, 77])]; + tensor var_6366_end_mask_0 = const()[name = tensor("op_6366_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6366_cast_fp16 = slice_by_index(begin = var_6366_begin_0, end = var_6366_end_0, end_mask = var_6366_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6366_cast_fp16")]; + tensor var_6370_begin_0 = const()[name = tensor("op_6370_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_6370_end_0 = const()[name = tensor("op_6370_end_0"), val = tensor([2, 768, 1, 77])]; + tensor var_6370_end_mask_0 = const()[name = tensor("op_6370_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6370_cast_fp16 = slice_by_index(begin = var_6370_begin_0, end = var_6370_end_0, end_mask = var_6370_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6370_cast_fp16")]; + tensor var_6374_begin_0 = const()[name = tensor("op_6374_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_6374_end_0 = const()[name = tensor("op_6374_end_0"), val = tensor([2, 832, 1, 77])]; + tensor var_6374_end_mask_0 = const()[name = tensor("op_6374_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6374_cast_fp16 = slice_by_index(begin = var_6374_begin_0, end = var_6374_end_0, end_mask = var_6374_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6374_cast_fp16")]; + tensor var_6378_begin_0 = const()[name = tensor("op_6378_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_6378_end_0 = const()[name = tensor("op_6378_end_0"), val = tensor([2, 896, 1, 77])]; + tensor var_6378_end_mask_0 = const()[name = tensor("op_6378_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6378_cast_fp16 = slice_by_index(begin = var_6378_begin_0, end = var_6378_end_0, end_mask = var_6378_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6378_cast_fp16")]; + tensor var_6382_begin_0 = const()[name = tensor("op_6382_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_6382_end_0 = const()[name = tensor("op_6382_end_0"), val = tensor([2, 960, 1, 77])]; + tensor var_6382_end_mask_0 = const()[name = tensor("op_6382_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6382_cast_fp16 = slice_by_index(begin = var_6382_begin_0, end = var_6382_end_0, end_mask = var_6382_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6382_cast_fp16")]; + tensor var_6386_begin_0 = const()[name = tensor("op_6386_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_6386_end_0 = const()[name = tensor("op_6386_end_0"), val = tensor([2, 1024, 1, 77])]; + tensor var_6386_end_mask_0 = const()[name = tensor("op_6386_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6386_cast_fp16 = slice_by_index(begin = var_6386_begin_0, end = var_6386_end_0, end_mask = var_6386_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6386_cast_fp16")]; + tensor var_6390_begin_0 = const()[name = tensor("op_6390_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_6390_end_0 = const()[name = tensor("op_6390_end_0"), val = tensor([2, 1088, 1, 77])]; + tensor var_6390_end_mask_0 = const()[name = tensor("op_6390_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6390_cast_fp16 = slice_by_index(begin = var_6390_begin_0, end = var_6390_end_0, end_mask = var_6390_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6390_cast_fp16")]; + tensor var_6394_begin_0 = const()[name = tensor("op_6394_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_6394_end_0 = const()[name = tensor("op_6394_end_0"), val = tensor([2, 1152, 1, 77])]; + tensor var_6394_end_mask_0 = const()[name = tensor("op_6394_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6394_cast_fp16 = slice_by_index(begin = var_6394_begin_0, end = var_6394_end_0, end_mask = var_6394_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6394_cast_fp16")]; + tensor var_6398_begin_0 = const()[name = tensor("op_6398_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_6398_end_0 = const()[name = tensor("op_6398_end_0"), val = tensor([2, 1216, 1, 77])]; + tensor var_6398_end_mask_0 = const()[name = tensor("op_6398_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6398_cast_fp16 = slice_by_index(begin = var_6398_begin_0, end = var_6398_end_0, end_mask = var_6398_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6398_cast_fp16")]; + tensor var_6402_begin_0 = const()[name = tensor("op_6402_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_6402_end_0 = const()[name = tensor("op_6402_end_0"), val = tensor([2, 1280, 1, 77])]; + tensor var_6402_end_mask_0 = const()[name = tensor("op_6402_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6402_cast_fp16 = slice_by_index(begin = var_6402_begin_0, end = var_6402_end_0, end_mask = var_6402_end_mask_0, x = v_31_cast_fp16)[name = tensor("op_6402_cast_fp16")]; + tensor var_6406_equation_0 = const()[name = tensor("op_6406_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6406_cast_fp16 = einsum(equation = var_6406_equation_0, values = (var_6248_cast_fp16, var_6165_cast_fp16))[name = tensor("op_6406_cast_fp16")]; + tensor var_6407_to_fp16 = const()[name = tensor("op_6407_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_401_cast_fp16 = mul(x = var_6406_cast_fp16, y = var_6407_to_fp16)[name = tensor("aw_401_cast_fp16")]; + tensor var_6410_equation_0 = const()[name = tensor("op_6410_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6410_cast_fp16 = einsum(equation = var_6410_equation_0, values = (var_6252_cast_fp16, var_6169_cast_fp16))[name = tensor("op_6410_cast_fp16")]; + tensor var_6411_to_fp16 = const()[name = tensor("op_6411_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_403_cast_fp16 = mul(x = var_6410_cast_fp16, y = var_6411_to_fp16)[name = tensor("aw_403_cast_fp16")]; + tensor var_6414_equation_0 = const()[name = tensor("op_6414_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6414_cast_fp16 = einsum(equation = var_6414_equation_0, values = (var_6256_cast_fp16, var_6173_cast_fp16))[name = tensor("op_6414_cast_fp16")]; + tensor var_6415_to_fp16 = const()[name = tensor("op_6415_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_405_cast_fp16 = mul(x = var_6414_cast_fp16, y = var_6415_to_fp16)[name = tensor("aw_405_cast_fp16")]; + tensor var_6418_equation_0 = const()[name = tensor("op_6418_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6418_cast_fp16 = einsum(equation = var_6418_equation_0, values = (var_6260_cast_fp16, var_6177_cast_fp16))[name = tensor("op_6418_cast_fp16")]; + tensor var_6419_to_fp16 = const()[name = tensor("op_6419_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_407_cast_fp16 = mul(x = var_6418_cast_fp16, y = var_6419_to_fp16)[name = tensor("aw_407_cast_fp16")]; + tensor var_6422_equation_0 = const()[name = tensor("op_6422_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6422_cast_fp16 = einsum(equation = var_6422_equation_0, values = (var_6264_cast_fp16, var_6181_cast_fp16))[name = tensor("op_6422_cast_fp16")]; + tensor var_6423_to_fp16 = const()[name = tensor("op_6423_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_409_cast_fp16 = mul(x = var_6422_cast_fp16, y = var_6423_to_fp16)[name = tensor("aw_409_cast_fp16")]; + tensor var_6426_equation_0 = const()[name = tensor("op_6426_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6426_cast_fp16 = einsum(equation = var_6426_equation_0, values = (var_6268_cast_fp16, var_6185_cast_fp16))[name = tensor("op_6426_cast_fp16")]; + tensor var_6427_to_fp16 = const()[name = tensor("op_6427_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_411_cast_fp16 = mul(x = var_6426_cast_fp16, y = var_6427_to_fp16)[name = tensor("aw_411_cast_fp16")]; + tensor var_6430_equation_0 = const()[name = tensor("op_6430_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6430_cast_fp16 = einsum(equation = var_6430_equation_0, values = (var_6272_cast_fp16, var_6189_cast_fp16))[name = tensor("op_6430_cast_fp16")]; + tensor var_6431_to_fp16 = const()[name = tensor("op_6431_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_413_cast_fp16 = mul(x = var_6430_cast_fp16, y = var_6431_to_fp16)[name = tensor("aw_413_cast_fp16")]; + tensor var_6434_equation_0 = const()[name = tensor("op_6434_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6434_cast_fp16 = einsum(equation = var_6434_equation_0, values = (var_6276_cast_fp16, var_6193_cast_fp16))[name = tensor("op_6434_cast_fp16")]; + tensor var_6435_to_fp16 = const()[name = tensor("op_6435_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_415_cast_fp16 = mul(x = var_6434_cast_fp16, y = var_6435_to_fp16)[name = tensor("aw_415_cast_fp16")]; + tensor var_6438_equation_0 = const()[name = tensor("op_6438_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6438_cast_fp16 = einsum(equation = var_6438_equation_0, values = (var_6280_cast_fp16, var_6197_cast_fp16))[name = tensor("op_6438_cast_fp16")]; + tensor var_6439_to_fp16 = const()[name = tensor("op_6439_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_417_cast_fp16 = mul(x = var_6438_cast_fp16, y = var_6439_to_fp16)[name = tensor("aw_417_cast_fp16")]; + tensor var_6442_equation_0 = const()[name = tensor("op_6442_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6442_cast_fp16 = einsum(equation = var_6442_equation_0, values = (var_6284_cast_fp16, var_6201_cast_fp16))[name = tensor("op_6442_cast_fp16")]; + tensor var_6443_to_fp16 = const()[name = tensor("op_6443_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_419_cast_fp16 = mul(x = var_6442_cast_fp16, y = var_6443_to_fp16)[name = tensor("aw_419_cast_fp16")]; + tensor var_6446_equation_0 = const()[name = tensor("op_6446_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6446_cast_fp16 = einsum(equation = var_6446_equation_0, values = (var_6288_cast_fp16, var_6205_cast_fp16))[name = tensor("op_6446_cast_fp16")]; + tensor var_6447_to_fp16 = const()[name = tensor("op_6447_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_421_cast_fp16 = mul(x = var_6446_cast_fp16, y = var_6447_to_fp16)[name = tensor("aw_421_cast_fp16")]; + tensor var_6450_equation_0 = const()[name = tensor("op_6450_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6450_cast_fp16 = einsum(equation = var_6450_equation_0, values = (var_6292_cast_fp16, var_6209_cast_fp16))[name = tensor("op_6450_cast_fp16")]; + tensor var_6451_to_fp16 = const()[name = tensor("op_6451_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_423_cast_fp16 = mul(x = var_6450_cast_fp16, y = var_6451_to_fp16)[name = tensor("aw_423_cast_fp16")]; + tensor var_6454_equation_0 = const()[name = tensor("op_6454_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6454_cast_fp16 = einsum(equation = var_6454_equation_0, values = (var_6296_cast_fp16, var_6213_cast_fp16))[name = tensor("op_6454_cast_fp16")]; + tensor var_6455_to_fp16 = const()[name = tensor("op_6455_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_425_cast_fp16 = mul(x = var_6454_cast_fp16, y = var_6455_to_fp16)[name = tensor("aw_425_cast_fp16")]; + tensor var_6458_equation_0 = const()[name = tensor("op_6458_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6458_cast_fp16 = einsum(equation = var_6458_equation_0, values = (var_6300_cast_fp16, var_6217_cast_fp16))[name = tensor("op_6458_cast_fp16")]; + tensor var_6459_to_fp16 = const()[name = tensor("op_6459_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_427_cast_fp16 = mul(x = var_6458_cast_fp16, y = var_6459_to_fp16)[name = tensor("aw_427_cast_fp16")]; + tensor var_6462_equation_0 = const()[name = tensor("op_6462_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6462_cast_fp16 = einsum(equation = var_6462_equation_0, values = (var_6304_cast_fp16, var_6221_cast_fp16))[name = tensor("op_6462_cast_fp16")]; + tensor var_6463_to_fp16 = const()[name = tensor("op_6463_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_429_cast_fp16 = mul(x = var_6462_cast_fp16, y = var_6463_to_fp16)[name = tensor("aw_429_cast_fp16")]; + tensor var_6466_equation_0 = const()[name = tensor("op_6466_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6466_cast_fp16 = einsum(equation = var_6466_equation_0, values = (var_6308_cast_fp16, var_6225_cast_fp16))[name = tensor("op_6466_cast_fp16")]; + tensor var_6467_to_fp16 = const()[name = tensor("op_6467_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_431_cast_fp16 = mul(x = var_6466_cast_fp16, y = var_6467_to_fp16)[name = tensor("aw_431_cast_fp16")]; + tensor var_6470_equation_0 = const()[name = tensor("op_6470_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6470_cast_fp16 = einsum(equation = var_6470_equation_0, values = (var_6312_cast_fp16, var_6229_cast_fp16))[name = tensor("op_6470_cast_fp16")]; + tensor var_6471_to_fp16 = const()[name = tensor("op_6471_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_433_cast_fp16 = mul(x = var_6470_cast_fp16, y = var_6471_to_fp16)[name = tensor("aw_433_cast_fp16")]; + tensor var_6474_equation_0 = const()[name = tensor("op_6474_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6474_cast_fp16 = einsum(equation = var_6474_equation_0, values = (var_6316_cast_fp16, var_6233_cast_fp16))[name = tensor("op_6474_cast_fp16")]; + tensor var_6475_to_fp16 = const()[name = tensor("op_6475_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_435_cast_fp16 = mul(x = var_6474_cast_fp16, y = var_6475_to_fp16)[name = tensor("aw_435_cast_fp16")]; + tensor var_6478_equation_0 = const()[name = tensor("op_6478_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6478_cast_fp16 = einsum(equation = var_6478_equation_0, values = (var_6320_cast_fp16, var_6237_cast_fp16))[name = tensor("op_6478_cast_fp16")]; + tensor var_6479_to_fp16 = const()[name = tensor("op_6479_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_437_cast_fp16 = mul(x = var_6478_cast_fp16, y = var_6479_to_fp16)[name = tensor("aw_437_cast_fp16")]; + tensor var_6482_equation_0 = const()[name = tensor("op_6482_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6482_cast_fp16 = einsum(equation = var_6482_equation_0, values = (var_6324_cast_fp16, var_6241_cast_fp16))[name = tensor("op_6482_cast_fp16")]; + tensor var_6483_to_fp16 = const()[name = tensor("op_6483_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_439_cast_fp16 = mul(x = var_6482_cast_fp16, y = var_6483_to_fp16)[name = tensor("aw_439_cast_fp16")]; + tensor var_6485_cast_fp16 = softmax(axis = var_5599, x = aw_401_cast_fp16)[name = tensor("op_6485_cast_fp16")]; + tensor var_6486_cast_fp16 = softmax(axis = var_5599, x = aw_403_cast_fp16)[name = tensor("op_6486_cast_fp16")]; + tensor var_6487_cast_fp16 = softmax(axis = var_5599, x = aw_405_cast_fp16)[name = tensor("op_6487_cast_fp16")]; + tensor var_6488_cast_fp16 = softmax(axis = var_5599, x = aw_407_cast_fp16)[name = tensor("op_6488_cast_fp16")]; + tensor var_6489_cast_fp16 = softmax(axis = var_5599, x = aw_409_cast_fp16)[name = tensor("op_6489_cast_fp16")]; + tensor var_6490_cast_fp16 = softmax(axis = var_5599, x = aw_411_cast_fp16)[name = tensor("op_6490_cast_fp16")]; + tensor var_6491_cast_fp16 = softmax(axis = var_5599, x = aw_413_cast_fp16)[name = tensor("op_6491_cast_fp16")]; + tensor var_6492_cast_fp16 = softmax(axis = var_5599, x = aw_415_cast_fp16)[name = tensor("op_6492_cast_fp16")]; + tensor var_6493_cast_fp16 = softmax(axis = var_5599, x = aw_417_cast_fp16)[name = tensor("op_6493_cast_fp16")]; + tensor var_6494_cast_fp16 = softmax(axis = var_5599, x = aw_419_cast_fp16)[name = tensor("op_6494_cast_fp16")]; + tensor var_6495_cast_fp16 = softmax(axis = var_5599, x = aw_421_cast_fp16)[name = tensor("op_6495_cast_fp16")]; + tensor var_6496_cast_fp16 = softmax(axis = var_5599, x = aw_423_cast_fp16)[name = tensor("op_6496_cast_fp16")]; + tensor var_6497_cast_fp16 = softmax(axis = var_5599, x = aw_425_cast_fp16)[name = tensor("op_6497_cast_fp16")]; + tensor var_6498_cast_fp16 = softmax(axis = var_5599, x = aw_427_cast_fp16)[name = tensor("op_6498_cast_fp16")]; + tensor var_6499_cast_fp16 = softmax(axis = var_5599, x = aw_429_cast_fp16)[name = tensor("op_6499_cast_fp16")]; + tensor var_6500_cast_fp16 = softmax(axis = var_5599, x = aw_431_cast_fp16)[name = tensor("op_6500_cast_fp16")]; + tensor var_6501_cast_fp16 = softmax(axis = var_5599, x = aw_433_cast_fp16)[name = tensor("op_6501_cast_fp16")]; + tensor var_6502_cast_fp16 = softmax(axis = var_5599, x = aw_435_cast_fp16)[name = tensor("op_6502_cast_fp16")]; + tensor var_6503_cast_fp16 = softmax(axis = var_5599, x = aw_437_cast_fp16)[name = tensor("op_6503_cast_fp16")]; + tensor var_6504_cast_fp16 = softmax(axis = var_5599, x = aw_439_cast_fp16)[name = tensor("op_6504_cast_fp16")]; + tensor var_6506_equation_0 = const()[name = tensor("op_6506_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6506_cast_fp16 = einsum(equation = var_6506_equation_0, values = (var_6326_cast_fp16, var_6485_cast_fp16))[name = tensor("op_6506_cast_fp16")]; + tensor var_6508_equation_0 = const()[name = tensor("op_6508_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6508_cast_fp16 = einsum(equation = var_6508_equation_0, values = (var_6330_cast_fp16, var_6486_cast_fp16))[name = tensor("op_6508_cast_fp16")]; + tensor var_6510_equation_0 = const()[name = tensor("op_6510_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6510_cast_fp16 = einsum(equation = var_6510_equation_0, values = (var_6334_cast_fp16, var_6487_cast_fp16))[name = tensor("op_6510_cast_fp16")]; + tensor var_6512_equation_0 = const()[name = tensor("op_6512_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6512_cast_fp16 = einsum(equation = var_6512_equation_0, values = (var_6338_cast_fp16, var_6488_cast_fp16))[name = tensor("op_6512_cast_fp16")]; + tensor var_6514_equation_0 = const()[name = tensor("op_6514_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6514_cast_fp16 = einsum(equation = var_6514_equation_0, values = (var_6342_cast_fp16, var_6489_cast_fp16))[name = tensor("op_6514_cast_fp16")]; + tensor var_6516_equation_0 = const()[name = tensor("op_6516_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6516_cast_fp16 = einsum(equation = var_6516_equation_0, values = (var_6346_cast_fp16, var_6490_cast_fp16))[name = tensor("op_6516_cast_fp16")]; + tensor var_6518_equation_0 = const()[name = tensor("op_6518_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6518_cast_fp16 = einsum(equation = var_6518_equation_0, values = (var_6350_cast_fp16, var_6491_cast_fp16))[name = tensor("op_6518_cast_fp16")]; + tensor var_6520_equation_0 = const()[name = tensor("op_6520_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6520_cast_fp16 = einsum(equation = var_6520_equation_0, values = (var_6354_cast_fp16, var_6492_cast_fp16))[name = tensor("op_6520_cast_fp16")]; + tensor var_6522_equation_0 = const()[name = tensor("op_6522_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6522_cast_fp16 = einsum(equation = var_6522_equation_0, values = (var_6358_cast_fp16, var_6493_cast_fp16))[name = tensor("op_6522_cast_fp16")]; + tensor var_6524_equation_0 = const()[name = tensor("op_6524_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6524_cast_fp16 = einsum(equation = var_6524_equation_0, values = (var_6362_cast_fp16, var_6494_cast_fp16))[name = tensor("op_6524_cast_fp16")]; + tensor var_6526_equation_0 = const()[name = tensor("op_6526_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6526_cast_fp16 = einsum(equation = var_6526_equation_0, values = (var_6366_cast_fp16, var_6495_cast_fp16))[name = tensor("op_6526_cast_fp16")]; + tensor var_6528_equation_0 = const()[name = tensor("op_6528_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6528_cast_fp16 = einsum(equation = var_6528_equation_0, values = (var_6370_cast_fp16, var_6496_cast_fp16))[name = tensor("op_6528_cast_fp16")]; + tensor var_6530_equation_0 = const()[name = tensor("op_6530_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6530_cast_fp16 = einsum(equation = var_6530_equation_0, values = (var_6374_cast_fp16, var_6497_cast_fp16))[name = tensor("op_6530_cast_fp16")]; + tensor var_6532_equation_0 = const()[name = tensor("op_6532_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6532_cast_fp16 = einsum(equation = var_6532_equation_0, values = (var_6378_cast_fp16, var_6498_cast_fp16))[name = tensor("op_6532_cast_fp16")]; + tensor var_6534_equation_0 = const()[name = tensor("op_6534_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6534_cast_fp16 = einsum(equation = var_6534_equation_0, values = (var_6382_cast_fp16, var_6499_cast_fp16))[name = tensor("op_6534_cast_fp16")]; + tensor var_6536_equation_0 = const()[name = tensor("op_6536_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6536_cast_fp16 = einsum(equation = var_6536_equation_0, values = (var_6386_cast_fp16, var_6500_cast_fp16))[name = tensor("op_6536_cast_fp16")]; + tensor var_6538_equation_0 = const()[name = tensor("op_6538_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6538_cast_fp16 = einsum(equation = var_6538_equation_0, values = (var_6390_cast_fp16, var_6501_cast_fp16))[name = tensor("op_6538_cast_fp16")]; + tensor var_6540_equation_0 = const()[name = tensor("op_6540_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6540_cast_fp16 = einsum(equation = var_6540_equation_0, values = (var_6394_cast_fp16, var_6502_cast_fp16))[name = tensor("op_6540_cast_fp16")]; + tensor var_6542_equation_0 = const()[name = tensor("op_6542_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6542_cast_fp16 = einsum(equation = var_6542_equation_0, values = (var_6398_cast_fp16, var_6503_cast_fp16))[name = tensor("op_6542_cast_fp16")]; + tensor var_6544_equation_0 = const()[name = tensor("op_6544_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_6544_cast_fp16 = einsum(equation = var_6544_equation_0, values = (var_6402_cast_fp16, var_6504_cast_fp16))[name = tensor("op_6544_cast_fp16")]; + tensor input_303_interleave_0 = const()[name = tensor("input_303_interleave_0"), val = tensor(false)]; + tensor input_303_cast_fp16 = concat(axis = var_5599, interleave = input_303_interleave_0, values = (var_6506_cast_fp16, var_6508_cast_fp16, var_6510_cast_fp16, var_6512_cast_fp16, var_6514_cast_fp16, var_6516_cast_fp16, var_6518_cast_fp16, var_6520_cast_fp16, var_6522_cast_fp16, var_6524_cast_fp16, var_6526_cast_fp16, var_6528_cast_fp16, var_6530_cast_fp16, var_6532_cast_fp16, var_6534_cast_fp16, var_6536_cast_fp16, var_6538_cast_fp16, var_6540_cast_fp16, var_6542_cast_fp16, var_6544_cast_fp16))[name = tensor("input_303_cast_fp16")]; + tensor var_6550 = const()[name = tensor("op_6550"), val = tensor([1, 1])]; + tensor var_6552 = const()[name = tensor("op_6552"), val = tensor([1, 1])]; + tensor var_6554_pad_type_0 = const()[name = tensor("op_6554_pad_type_0"), val = tensor("custom")]; + tensor var_6554_pad_0 = const()[name = tensor("op_6554_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1151103936)))]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1154380800)))]; + tensor var_6554_cast_fp16 = conv(bias = up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_6552, groups = var_5599, pad = var_6554_pad_0, pad_type = var_6554_pad_type_0, strides = var_6550, weight = up_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_303_cast_fp16)[name = tensor("op_6554_cast_fp16")]; + tensor inputs_47_cast_fp16 = add(x = var_6554_cast_fp16, y = inputs_45_cast_fp16)[name = tensor("inputs_47_cast_fp16")]; + tensor var_6558 = const()[name = tensor("op_6558"), val = tensor([1])]; + tensor channels_mean_47_cast_fp16 = reduce_mean(axes = var_6558, keep_dims = var_5594, x = inputs_47_cast_fp16)[name = tensor("channels_mean_47_cast_fp16")]; + tensor zero_mean_47_cast_fp16 = sub(x = inputs_47_cast_fp16, y = channels_mean_47_cast_fp16)[name = tensor("zero_mean_47_cast_fp16")]; + tensor zero_mean_sq_47_cast_fp16 = mul(x = zero_mean_47_cast_fp16, y = zero_mean_47_cast_fp16)[name = tensor("zero_mean_sq_47_cast_fp16")]; + tensor var_6562 = const()[name = tensor("op_6562"), val = tensor([1])]; + tensor var_6563_cast_fp16 = reduce_mean(axes = var_6562, keep_dims = var_5594, x = zero_mean_sq_47_cast_fp16)[name = tensor("op_6563_cast_fp16")]; + tensor var_6564_to_fp16 = const()[name = tensor("op_6564_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_6565_cast_fp16 = add(x = var_6563_cast_fp16, y = var_6564_to_fp16)[name = tensor("op_6565_cast_fp16")]; + tensor denom_47_epsilon_0_to_fp16 = const()[name = tensor("denom_47_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_47_cast_fp16 = rsqrt(epsilon = denom_47_epsilon_0_to_fp16, x = var_6565_cast_fp16)[name = tensor("denom_47_cast_fp16")]; + tensor out_47_cast_fp16 = mul(x = zero_mean_47_cast_fp16, y = denom_47_cast_fp16)[name = tensor("out_47_cast_fp16")]; + tensor var_6569_to_fp16 = const()[name = tensor("op_6569_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1154383424)))]; + tensor var_6570_cast_fp16 = add(x = out_47_cast_fp16, y = var_6569_to_fp16)[name = tensor("op_6570_cast_fp16")]; + tensor var_6572_to_fp16 = const()[name = tensor("op_6572_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1154386048)))]; + tensor input_305_cast_fp16 = mul(x = var_6570_cast_fp16, y = var_6572_to_fp16)[name = tensor("input_305_cast_fp16")]; + tensor var_6580 = const()[name = tensor("op_6580"), val = tensor([1, 1])]; + tensor var_6582 = const()[name = tensor("op_6582"), val = tensor([1, 1])]; + tensor var_6584_pad_type_0 = const()[name = tensor("op_6584_pad_type_0"), val = tensor("custom")]; + tensor var_6584_pad_0 = const()[name = tensor("op_6584_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1154388672)))]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1180603136)))]; + tensor var_6584_cast_fp16 = conv(bias = up_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_6582, groups = var_5599, pad = var_6584_pad_0, pad_type = var_6584_pad_type_0, strides = var_6580, weight = up_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_305_cast_fp16)[name = tensor("op_6584_cast_fp16")]; + tensor var_6585_split_sizes_0 = const()[name = tensor("op_6585_split_sizes_0"), val = tensor([5120, 5120])]; + tensor var_6585_axis_0 = const()[name = tensor("op_6585_axis_0"), val = tensor(1)]; + tensor var_6585_cast_fp16_0, tensor var_6585_cast_fp16_1 = split(axis = var_6585_axis_0, split_sizes = var_6585_split_sizes_0, x = var_6584_cast_fp16)[name = tensor("op_6585_cast_fp16")]; + tensor var_6587_mode_0 = const()[name = tensor("op_6587_mode_0"), val = tensor("EXACT")]; + tensor var_6587_cast_fp16 = gelu(mode = var_6587_mode_0, x = var_6585_cast_fp16_1)[name = tensor("op_6587_cast_fp16")]; + tensor input_307_cast_fp16 = mul(x = var_6585_cast_fp16_0, y = var_6587_cast_fp16)[name = tensor("input_307_cast_fp16")]; + tensor var_6591 = const()[name = tensor("op_6591"), val = tensor([1, 1])]; + tensor var_6593 = const()[name = tensor("op_6593"), val = tensor([1, 1])]; + tensor var_6595_pad_type_0 = const()[name = tensor("op_6595_pad_type_0"), val = tensor("custom")]; + tensor var_6595_pad_0 = const()[name = tensor("op_6595_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1180623680)))]; + tensor up_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1193730944)))]; + tensor var_6595_cast_fp16 = conv(bias = up_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_6593, groups = var_5599, pad = var_6595_pad_0, pad_type = var_6595_pad_type_0, strides = var_6591, weight = up_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_307_cast_fp16)[name = tensor("op_6595_cast_fp16")]; + tensor hidden_states_173_cast_fp16 = add(x = var_6595_cast_fp16, y = inputs_47_cast_fp16)[name = tensor("hidden_states_173_cast_fp16")]; + tensor var_6597 = const()[name = tensor("op_6597"), val = tensor([2, 1280, 12, 12])]; + tensor input_309_cast_fp16 = reshape(shape = var_6597, x = hidden_states_173_cast_fp16)[name = tensor("input_309_cast_fp16")]; + tensor var_6601 = const()[name = tensor("op_6601"), val = tensor([1, 1])]; + tensor var_6603 = const()[name = tensor("op_6603"), val = tensor([1, 1])]; + tensor hidden_states_175_pad_type_0 = const()[name = tensor("hidden_states_175_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_175_pad_0 = const()[name = tensor("hidden_states_175_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1193733568)))]; + tensor up_blocks_1_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1197010432)))]; + tensor hidden_states_175_cast_fp16 = conv(bias = up_blocks_1_attentions_0_proj_out_bias_to_fp16, dilations = var_6603, groups = var_5599, pad = hidden_states_175_pad_0, pad_type = hidden_states_175_pad_type_0, strides = var_6601, weight = up_blocks_1_attentions_0_proj_out_weight_to_fp16, x = input_309_cast_fp16)[name = tensor("hidden_states_175_cast_fp16")]; + tensor hidden_states_177_cast_fp16 = add(x = hidden_states_175_cast_fp16, y = hidden_states_163_cast_fp16)[name = tensor("hidden_states_177_cast_fp16")]; + tensor input_311_interleave_0 = const()[name = tensor("input_311_interleave_0"), val = tensor(false)]; + tensor input_311_cast_fp16 = concat(axis = var_5599, interleave = input_311_interleave_0, values = (hidden_states_177_cast_fp16, input_143_cast_fp16))[name = tensor("input_311_cast_fp16")]; + tensor reshape_144_shape_0 = const()[name = tensor("reshape_144_shape_0"), val = tensor([2, 32, 80, 12, 12])]; + tensor reshape_144_cast_fp16 = reshape(shape = reshape_144_shape_0, x = input_311_cast_fp16)[name = tensor("reshape_144_cast_fp16")]; + tensor reduce_mean_108_axes_0 = const()[name = tensor("reduce_mean_108_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_108_keep_dims_0 = const()[name = tensor("reduce_mean_108_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_108_cast_fp16 = reduce_mean(axes = reduce_mean_108_axes_0, keep_dims = reduce_mean_108_keep_dims_0, x = reshape_144_cast_fp16)[name = tensor("reduce_mean_108_cast_fp16")]; + tensor sub_72_cast_fp16 = sub(x = reshape_144_cast_fp16, y = reduce_mean_108_cast_fp16)[name = tensor("sub_72_cast_fp16")]; + tensor square_36_cast_fp16 = square(x = sub_72_cast_fp16)[name = tensor("square_36_cast_fp16")]; + tensor reduce_mean_110_axes_0 = const()[name = tensor("reduce_mean_110_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_110_keep_dims_0 = const()[name = tensor("reduce_mean_110_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_110_cast_fp16 = reduce_mean(axes = reduce_mean_110_axes_0, keep_dims = reduce_mean_110_keep_dims_0, x = square_36_cast_fp16)[name = tensor("reduce_mean_110_cast_fp16")]; + tensor add_72_y_0_to_fp16 = const()[name = tensor("add_72_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_72_cast_fp16 = add(x = reduce_mean_110_cast_fp16, y = add_72_y_0_to_fp16)[name = tensor("add_72_cast_fp16")]; + tensor sqrt_36_cast_fp16 = sqrt(x = add_72_cast_fp16)[name = tensor("sqrt_36_cast_fp16")]; + tensor real_div_36_cast_fp16 = real_div(x = sub_72_cast_fp16, y = sqrt_36_cast_fp16)[name = tensor("real_div_36_cast_fp16")]; + tensor reshape_145_shape_0 = const()[name = tensor("reshape_145_shape_0"), val = tensor([2, 2560, 12, 12])]; + tensor reshape_145_cast_fp16 = reshape(shape = reshape_145_shape_0, x = real_div_36_cast_fp16)[name = tensor("reshape_145_cast_fp16")]; + tensor add_73_gamma_0_to_fp16 = const()[name = tensor("add_73_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1197013056)))]; + tensor add_73_beta_0_to_fp16 = const()[name = tensor("add_73_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1197018240)))]; + tensor add_73_epsilon_0_to_fp16 = const()[name = tensor("add_73_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_73_cast_fp16 = batch_norm(beta = add_73_beta_0_to_fp16, epsilon = add_73_epsilon_0_to_fp16, gamma = add_73_gamma_0_to_fp16, mean = add_55_mean_0_to_fp16, variance = add_55_variance_0_to_fp16, x = reshape_145_cast_fp16)[name = tensor("add_73_cast_fp16")]; + tensor input_315_cast_fp16 = silu(x = add_73_cast_fp16)[name = tensor("input_315_cast_fp16")]; + tensor var_6621 = const()[name = tensor("op_6621"), val = tensor([1, 1])]; + tensor var_6623 = const()[name = tensor("op_6623"), val = tensor([1, 1])]; + tensor hidden_states_179_pad_type_0 = const()[name = tensor("hidden_states_179_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_179_pad_0 = const()[name = tensor("hidden_states_179_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_1_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1197023424)))]; + tensor up_blocks_1_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1256005888)))]; + tensor hidden_states_179_cast_fp16 = conv(bias = up_blocks_1_resnets_1_conv1_bias_to_fp16, dilations = var_6623, groups = var_5599, pad = hidden_states_179_pad_0, pad_type = hidden_states_179_pad_type_0, strides = var_6621, weight = up_blocks_1_resnets_1_conv1_weight_to_fp16, x = input_315_cast_fp16)[name = tensor("hidden_states_179_cast_fp16")]; + tensor var_6629 = const()[name = tensor("op_6629"), val = tensor([1, 1])]; + tensor var_6631 = const()[name = tensor("op_6631"), val = tensor([1, 1])]; + tensor temb_29_pad_type_0 = const()[name = tensor("temb_29_pad_type_0"), val = tensor("custom")]; + tensor temb_29_pad_0 = const()[name = tensor("temb_29_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1256008512)))]; + tensor up_blocks_1_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1259285376)))]; + tensor temb_29_cast_fp16 = conv(bias = up_blocks_1_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_6631, groups = var_5599, pad = temb_29_pad_0, pad_type = temb_29_pad_type_0, strides = var_6629, weight = up_blocks_1_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_29_cast_fp16")]; + tensor input_319_cast_fp16 = add(x = hidden_states_179_cast_fp16, y = temb_29_cast_fp16)[name = tensor("input_319_cast_fp16")]; + tensor reshape_148_shape_0 = const()[name = tensor("reshape_148_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_148_cast_fp16 = reshape(shape = reshape_148_shape_0, x = input_319_cast_fp16)[name = tensor("reshape_148_cast_fp16")]; + tensor reduce_mean_111_axes_0 = const()[name = tensor("reduce_mean_111_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_111_keep_dims_0 = const()[name = tensor("reduce_mean_111_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_111_cast_fp16 = reduce_mean(axes = reduce_mean_111_axes_0, keep_dims = reduce_mean_111_keep_dims_0, x = reshape_148_cast_fp16)[name = tensor("reduce_mean_111_cast_fp16")]; + tensor sub_74_cast_fp16 = sub(x = reshape_148_cast_fp16, y = reduce_mean_111_cast_fp16)[name = tensor("sub_74_cast_fp16")]; + tensor square_37_cast_fp16 = square(x = sub_74_cast_fp16)[name = tensor("square_37_cast_fp16")]; + tensor reduce_mean_113_axes_0 = const()[name = tensor("reduce_mean_113_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_113_keep_dims_0 = const()[name = tensor("reduce_mean_113_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_113_cast_fp16 = reduce_mean(axes = reduce_mean_113_axes_0, keep_dims = reduce_mean_113_keep_dims_0, x = square_37_cast_fp16)[name = tensor("reduce_mean_113_cast_fp16")]; + tensor add_74_y_0_to_fp16 = const()[name = tensor("add_74_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_74_cast_fp16 = add(x = reduce_mean_113_cast_fp16, y = add_74_y_0_to_fp16)[name = tensor("add_74_cast_fp16")]; + tensor sqrt_37_cast_fp16 = sqrt(x = add_74_cast_fp16)[name = tensor("sqrt_37_cast_fp16")]; + tensor real_div_37_cast_fp16 = real_div(x = sub_74_cast_fp16, y = sqrt_37_cast_fp16)[name = tensor("real_div_37_cast_fp16")]; + tensor reshape_149_shape_0 = const()[name = tensor("reshape_149_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_149_cast_fp16 = reshape(shape = reshape_149_shape_0, x = real_div_37_cast_fp16)[name = tensor("reshape_149_cast_fp16")]; + tensor add_75_gamma_0_to_fp16 = const()[name = tensor("add_75_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1259288000)))]; + tensor add_75_beta_0_to_fp16 = const()[name = tensor("add_75_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1259290624)))]; + tensor add_75_epsilon_0_to_fp16 = const()[name = tensor("add_75_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_75_cast_fp16 = batch_norm(beta = add_75_beta_0_to_fp16, epsilon = add_75_epsilon_0_to_fp16, gamma = add_75_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_149_cast_fp16)[name = tensor("add_75_cast_fp16")]; + tensor input_323_cast_fp16 = silu(x = add_75_cast_fp16)[name = tensor("input_323_cast_fp16")]; + tensor var_6641 = const()[name = tensor("op_6641"), val = tensor([1, 1])]; + tensor var_6643 = const()[name = tensor("op_6643"), val = tensor([1, 1])]; + tensor hidden_states_181_pad_type_0 = const()[name = tensor("hidden_states_181_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_181_pad_0 = const()[name = tensor("hidden_states_181_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_1_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1259293248)))]; + tensor up_blocks_1_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1288784512)))]; + tensor hidden_states_181_cast_fp16 = conv(bias = up_blocks_1_resnets_1_conv2_bias_to_fp16, dilations = var_6643, groups = var_5599, pad = hidden_states_181_pad_0, pad_type = hidden_states_181_pad_type_0, strides = var_6641, weight = up_blocks_1_resnets_1_conv2_weight_to_fp16, x = input_323_cast_fp16)[name = tensor("hidden_states_181_cast_fp16")]; + tensor var_6648 = const()[name = tensor("op_6648"), val = tensor([1, 1])]; + tensor var_6650 = const()[name = tensor("op_6650"), val = tensor([1, 1])]; + tensor x_13_pad_type_0 = const()[name = tensor("x_13_pad_type_0"), val = tensor("custom")]; + tensor x_13_pad_0 = const()[name = tensor("x_13_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_resnets_1_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_1_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1288787136)))]; + tensor up_blocks_1_resnets_1_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_1_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1295340800)))]; + tensor x_13_cast_fp16 = conv(bias = up_blocks_1_resnets_1_conv_shortcut_bias_to_fp16, dilations = var_6650, groups = var_5599, pad = x_13_pad_0, pad_type = x_13_pad_type_0, strides = var_6648, weight = up_blocks_1_resnets_1_conv_shortcut_weight_to_fp16, x = input_311_cast_fp16)[name = tensor("x_13_cast_fp16")]; + tensor hidden_states_183_cast_fp16 = add(x = x_13_cast_fp16, y = hidden_states_181_cast_fp16)[name = tensor("hidden_states_183_cast_fp16")]; + tensor reshape_152_shape_0 = const()[name = tensor("reshape_152_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_152_cast_fp16 = reshape(shape = reshape_152_shape_0, x = hidden_states_183_cast_fp16)[name = tensor("reshape_152_cast_fp16")]; + tensor reduce_mean_114_axes_0 = const()[name = tensor("reduce_mean_114_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_114_keep_dims_0 = const()[name = tensor("reduce_mean_114_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_114_cast_fp16 = reduce_mean(axes = reduce_mean_114_axes_0, keep_dims = reduce_mean_114_keep_dims_0, x = reshape_152_cast_fp16)[name = tensor("reduce_mean_114_cast_fp16")]; + tensor sub_76_cast_fp16 = sub(x = reshape_152_cast_fp16, y = reduce_mean_114_cast_fp16)[name = tensor("sub_76_cast_fp16")]; + tensor square_38_cast_fp16 = square(x = sub_76_cast_fp16)[name = tensor("square_38_cast_fp16")]; + tensor reduce_mean_116_axes_0 = const()[name = tensor("reduce_mean_116_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_116_keep_dims_0 = const()[name = tensor("reduce_mean_116_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_116_cast_fp16 = reduce_mean(axes = reduce_mean_116_axes_0, keep_dims = reduce_mean_116_keep_dims_0, x = square_38_cast_fp16)[name = tensor("reduce_mean_116_cast_fp16")]; + tensor add_76_y_0_to_fp16 = const()[name = tensor("add_76_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_76_cast_fp16 = add(x = reduce_mean_116_cast_fp16, y = add_76_y_0_to_fp16)[name = tensor("add_76_cast_fp16")]; + tensor sqrt_38_cast_fp16 = sqrt(x = add_76_cast_fp16)[name = tensor("sqrt_38_cast_fp16")]; + tensor real_div_38_cast_fp16 = real_div(x = sub_76_cast_fp16, y = sqrt_38_cast_fp16)[name = tensor("real_div_38_cast_fp16")]; + tensor reshape_153_shape_0 = const()[name = tensor("reshape_153_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_153_cast_fp16 = reshape(shape = reshape_153_shape_0, x = real_div_38_cast_fp16)[name = tensor("reshape_153_cast_fp16")]; + tensor add_77_gamma_0_to_fp16 = const()[name = tensor("add_77_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1295343424)))]; + tensor add_77_beta_0_to_fp16 = const()[name = tensor("add_77_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1295346048)))]; + tensor add_77_epsilon_0_to_fp16 = const()[name = tensor("add_77_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_77_cast_fp16 = batch_norm(beta = add_77_beta_0_to_fp16, epsilon = add_77_epsilon_0_to_fp16, gamma = add_77_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_153_cast_fp16)[name = tensor("add_77_cast_fp16")]; + tensor var_6670 = const()[name = tensor("op_6670"), val = tensor([1, 1])]; + tensor var_6672 = const()[name = tensor("op_6672"), val = tensor([1, 1])]; + tensor hidden_states_185_pad_type_0 = const()[name = tensor("hidden_states_185_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_185_pad_0 = const()[name = tensor("hidden_states_185_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_proj_in_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1295348672)))]; + tensor up_blocks_1_attentions_1_proj_in_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1298625536)))]; + tensor hidden_states_185_cast_fp16 = conv(bias = up_blocks_1_attentions_1_proj_in_bias_to_fp16, dilations = var_6672, groups = var_5599, pad = hidden_states_185_pad_0, pad_type = hidden_states_185_pad_type_0, strides = var_6670, weight = up_blocks_1_attentions_1_proj_in_weight_to_fp16, x = add_77_cast_fp16)[name = tensor("hidden_states_185_cast_fp16")]; + tensor var_6677 = const()[name = tensor("op_6677"), val = tensor([2, 1280, 1, 144])]; + tensor inputs_49_cast_fp16 = reshape(shape = var_6677, x = hidden_states_185_cast_fp16)[name = tensor("inputs_49_cast_fp16")]; + tensor var_6687 = const()[name = tensor("op_6687"), val = tensor([1])]; + tensor channels_mean_49_cast_fp16 = reduce_mean(axes = var_6687, keep_dims = var_5594, x = inputs_49_cast_fp16)[name = tensor("channels_mean_49_cast_fp16")]; + tensor zero_mean_49_cast_fp16 = sub(x = inputs_49_cast_fp16, y = channels_mean_49_cast_fp16)[name = tensor("zero_mean_49_cast_fp16")]; + tensor zero_mean_sq_49_cast_fp16 = mul(x = zero_mean_49_cast_fp16, y = zero_mean_49_cast_fp16)[name = tensor("zero_mean_sq_49_cast_fp16")]; + tensor var_6691 = const()[name = tensor("op_6691"), val = tensor([1])]; + tensor var_6692_cast_fp16 = reduce_mean(axes = var_6691, keep_dims = var_5594, x = zero_mean_sq_49_cast_fp16)[name = tensor("op_6692_cast_fp16")]; + tensor var_6693_to_fp16 = const()[name = tensor("op_6693_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_6694_cast_fp16 = add(x = var_6692_cast_fp16, y = var_6693_to_fp16)[name = tensor("op_6694_cast_fp16")]; + tensor denom_49_epsilon_0_to_fp16 = const()[name = tensor("denom_49_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_49_cast_fp16 = rsqrt(epsilon = denom_49_epsilon_0_to_fp16, x = var_6694_cast_fp16)[name = tensor("denom_49_cast_fp16")]; + tensor out_49_cast_fp16 = mul(x = zero_mean_49_cast_fp16, y = denom_49_cast_fp16)[name = tensor("out_49_cast_fp16")]; + tensor var_6698_to_fp16 = const()[name = tensor("op_6698_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1298628160)))]; + tensor var_6699_cast_fp16 = add(x = out_49_cast_fp16, y = var_6698_to_fp16)[name = tensor("op_6699_cast_fp16")]; + tensor var_6701_to_fp16 = const()[name = tensor("op_6701_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1298630784)))]; + tensor hidden_states_187_cast_fp16 = mul(x = var_6699_cast_fp16, y = var_6701_to_fp16)[name = tensor("hidden_states_187_cast_fp16")]; + tensor var_6708 = const()[name = tensor("op_6708"), val = tensor([1, 1])]; + tensor var_6710 = const()[name = tensor("op_6710"), val = tensor([1, 1])]; + tensor q_33_pad_type_0 = const()[name = tensor("q_33_pad_type_0"), val = tensor("custom")]; + tensor q_33_pad_0 = const()[name = tensor("q_33_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1298633408)))]; + tensor q_33_cast_fp16 = conv(dilations = var_6710, groups = var_5599, pad = q_33_pad_0, pad_type = q_33_pad_type_0, strides = var_6708, weight = up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_187_cast_fp16)[name = tensor("q_33_cast_fp16")]; + tensor var_6714 = const()[name = tensor("op_6714"), val = tensor([1, 1])]; + tensor var_6716 = const()[name = tensor("op_6716"), val = tensor([1, 1])]; + tensor k_65_pad_type_0 = const()[name = tensor("k_65_pad_type_0"), val = tensor("custom")]; + tensor k_65_pad_0 = const()[name = tensor("k_65_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1301910272)))]; + tensor k_65_cast_fp16 = conv(dilations = var_6716, groups = var_5599, pad = k_65_pad_0, pad_type = k_65_pad_type_0, strides = var_6714, weight = up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_187_cast_fp16)[name = tensor("k_65_cast_fp16")]; + tensor var_6720 = const()[name = tensor("op_6720"), val = tensor([1, 1])]; + tensor var_6722 = const()[name = tensor("op_6722"), val = tensor([1, 1])]; + tensor v_33_pad_type_0 = const()[name = tensor("v_33_pad_type_0"), val = tensor("custom")]; + tensor v_33_pad_0 = const()[name = tensor("v_33_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1305187136)))]; + tensor v_33_cast_fp16 = conv(dilations = var_6722, groups = var_5599, pad = v_33_pad_0, pad_type = v_33_pad_type_0, strides = var_6720, weight = up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_187_cast_fp16)[name = tensor("v_33_cast_fp16")]; + tensor var_6726_begin_0 = const()[name = tensor("op_6726_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_6726_end_0 = const()[name = tensor("op_6726_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_6726_end_mask_0 = const()[name = tensor("op_6726_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6726_cast_fp16 = slice_by_index(begin = var_6726_begin_0, end = var_6726_end_0, end_mask = var_6726_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6726_cast_fp16")]; + tensor var_6730_begin_0 = const()[name = tensor("op_6730_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_6730_end_0 = const()[name = tensor("op_6730_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_6730_end_mask_0 = const()[name = tensor("op_6730_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6730_cast_fp16 = slice_by_index(begin = var_6730_begin_0, end = var_6730_end_0, end_mask = var_6730_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6730_cast_fp16")]; + tensor var_6734_begin_0 = const()[name = tensor("op_6734_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_6734_end_0 = const()[name = tensor("op_6734_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_6734_end_mask_0 = const()[name = tensor("op_6734_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6734_cast_fp16 = slice_by_index(begin = var_6734_begin_0, end = var_6734_end_0, end_mask = var_6734_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6734_cast_fp16")]; + tensor var_6738_begin_0 = const()[name = tensor("op_6738_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_6738_end_0 = const()[name = tensor("op_6738_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_6738_end_mask_0 = const()[name = tensor("op_6738_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6738_cast_fp16 = slice_by_index(begin = var_6738_begin_0, end = var_6738_end_0, end_mask = var_6738_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6738_cast_fp16")]; + tensor var_6742_begin_0 = const()[name = tensor("op_6742_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_6742_end_0 = const()[name = tensor("op_6742_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_6742_end_mask_0 = const()[name = tensor("op_6742_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6742_cast_fp16 = slice_by_index(begin = var_6742_begin_0, end = var_6742_end_0, end_mask = var_6742_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6742_cast_fp16")]; + tensor var_6746_begin_0 = const()[name = tensor("op_6746_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_6746_end_0 = const()[name = tensor("op_6746_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_6746_end_mask_0 = const()[name = tensor("op_6746_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6746_cast_fp16 = slice_by_index(begin = var_6746_begin_0, end = var_6746_end_0, end_mask = var_6746_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6746_cast_fp16")]; + tensor var_6750_begin_0 = const()[name = tensor("op_6750_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_6750_end_0 = const()[name = tensor("op_6750_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_6750_end_mask_0 = const()[name = tensor("op_6750_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6750_cast_fp16 = slice_by_index(begin = var_6750_begin_0, end = var_6750_end_0, end_mask = var_6750_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6750_cast_fp16")]; + tensor var_6754_begin_0 = const()[name = tensor("op_6754_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_6754_end_0 = const()[name = tensor("op_6754_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_6754_end_mask_0 = const()[name = tensor("op_6754_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6754_cast_fp16 = slice_by_index(begin = var_6754_begin_0, end = var_6754_end_0, end_mask = var_6754_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6754_cast_fp16")]; + tensor var_6758_begin_0 = const()[name = tensor("op_6758_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_6758_end_0 = const()[name = tensor("op_6758_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_6758_end_mask_0 = const()[name = tensor("op_6758_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6758_cast_fp16 = slice_by_index(begin = var_6758_begin_0, end = var_6758_end_0, end_mask = var_6758_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6758_cast_fp16")]; + tensor var_6762_begin_0 = const()[name = tensor("op_6762_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_6762_end_0 = const()[name = tensor("op_6762_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_6762_end_mask_0 = const()[name = tensor("op_6762_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6762_cast_fp16 = slice_by_index(begin = var_6762_begin_0, end = var_6762_end_0, end_mask = var_6762_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6762_cast_fp16")]; + tensor var_6766_begin_0 = const()[name = tensor("op_6766_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_6766_end_0 = const()[name = tensor("op_6766_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_6766_end_mask_0 = const()[name = tensor("op_6766_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6766_cast_fp16 = slice_by_index(begin = var_6766_begin_0, end = var_6766_end_0, end_mask = var_6766_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6766_cast_fp16")]; + tensor var_6770_begin_0 = const()[name = tensor("op_6770_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_6770_end_0 = const()[name = tensor("op_6770_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_6770_end_mask_0 = const()[name = tensor("op_6770_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6770_cast_fp16 = slice_by_index(begin = var_6770_begin_0, end = var_6770_end_0, end_mask = var_6770_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6770_cast_fp16")]; + tensor var_6774_begin_0 = const()[name = tensor("op_6774_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_6774_end_0 = const()[name = tensor("op_6774_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_6774_end_mask_0 = const()[name = tensor("op_6774_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6774_cast_fp16 = slice_by_index(begin = var_6774_begin_0, end = var_6774_end_0, end_mask = var_6774_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6774_cast_fp16")]; + tensor var_6778_begin_0 = const()[name = tensor("op_6778_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_6778_end_0 = const()[name = tensor("op_6778_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_6778_end_mask_0 = const()[name = tensor("op_6778_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6778_cast_fp16 = slice_by_index(begin = var_6778_begin_0, end = var_6778_end_0, end_mask = var_6778_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6778_cast_fp16")]; + tensor var_6782_begin_0 = const()[name = tensor("op_6782_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_6782_end_0 = const()[name = tensor("op_6782_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_6782_end_mask_0 = const()[name = tensor("op_6782_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6782_cast_fp16 = slice_by_index(begin = var_6782_begin_0, end = var_6782_end_0, end_mask = var_6782_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6782_cast_fp16")]; + tensor var_6786_begin_0 = const()[name = tensor("op_6786_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_6786_end_0 = const()[name = tensor("op_6786_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_6786_end_mask_0 = const()[name = tensor("op_6786_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6786_cast_fp16 = slice_by_index(begin = var_6786_begin_0, end = var_6786_end_0, end_mask = var_6786_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6786_cast_fp16")]; + tensor var_6790_begin_0 = const()[name = tensor("op_6790_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_6790_end_0 = const()[name = tensor("op_6790_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_6790_end_mask_0 = const()[name = tensor("op_6790_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6790_cast_fp16 = slice_by_index(begin = var_6790_begin_0, end = var_6790_end_0, end_mask = var_6790_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6790_cast_fp16")]; + tensor var_6794_begin_0 = const()[name = tensor("op_6794_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_6794_end_0 = const()[name = tensor("op_6794_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_6794_end_mask_0 = const()[name = tensor("op_6794_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6794_cast_fp16 = slice_by_index(begin = var_6794_begin_0, end = var_6794_end_0, end_mask = var_6794_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6794_cast_fp16")]; + tensor var_6798_begin_0 = const()[name = tensor("op_6798_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_6798_end_0 = const()[name = tensor("op_6798_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_6798_end_mask_0 = const()[name = tensor("op_6798_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6798_cast_fp16 = slice_by_index(begin = var_6798_begin_0, end = var_6798_end_0, end_mask = var_6798_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6798_cast_fp16")]; + tensor var_6802_begin_0 = const()[name = tensor("op_6802_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_6802_end_0 = const()[name = tensor("op_6802_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_6802_end_mask_0 = const()[name = tensor("op_6802_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6802_cast_fp16 = slice_by_index(begin = var_6802_begin_0, end = var_6802_end_0, end_mask = var_6802_end_mask_0, x = q_33_cast_fp16)[name = tensor("op_6802_cast_fp16")]; + tensor k_67_perm_0 = const()[name = tensor("k_67_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_6809_begin_0 = const()[name = tensor("op_6809_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_6809_end_0 = const()[name = tensor("op_6809_end_0"), val = tensor([2, 144, 1, 64])]; + tensor var_6809_end_mask_0 = const()[name = tensor("op_6809_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_15 = transpose(perm = k_67_perm_0, x = k_65_cast_fp16)[name = tensor("transpose_15")]; + tensor var_6809_cast_fp16 = slice_by_index(begin = var_6809_begin_0, end = var_6809_end_0, end_mask = var_6809_end_mask_0, x = transpose_15)[name = tensor("op_6809_cast_fp16")]; + tensor var_6813_begin_0 = const()[name = tensor("op_6813_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_6813_end_0 = const()[name = tensor("op_6813_end_0"), val = tensor([2, 144, 1, 128])]; + tensor var_6813_end_mask_0 = const()[name = tensor("op_6813_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6813_cast_fp16 = slice_by_index(begin = var_6813_begin_0, end = var_6813_end_0, end_mask = var_6813_end_mask_0, x = transpose_15)[name = tensor("op_6813_cast_fp16")]; + tensor var_6817_begin_0 = const()[name = tensor("op_6817_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_6817_end_0 = const()[name = tensor("op_6817_end_0"), val = tensor([2, 144, 1, 192])]; + tensor var_6817_end_mask_0 = const()[name = tensor("op_6817_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6817_cast_fp16 = slice_by_index(begin = var_6817_begin_0, end = var_6817_end_0, end_mask = var_6817_end_mask_0, x = transpose_15)[name = tensor("op_6817_cast_fp16")]; + tensor var_6821_begin_0 = const()[name = tensor("op_6821_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_6821_end_0 = const()[name = tensor("op_6821_end_0"), val = tensor([2, 144, 1, 256])]; + tensor var_6821_end_mask_0 = const()[name = tensor("op_6821_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6821_cast_fp16 = slice_by_index(begin = var_6821_begin_0, end = var_6821_end_0, end_mask = var_6821_end_mask_0, x = transpose_15)[name = tensor("op_6821_cast_fp16")]; + tensor var_6825_begin_0 = const()[name = tensor("op_6825_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_6825_end_0 = const()[name = tensor("op_6825_end_0"), val = tensor([2, 144, 1, 320])]; + tensor var_6825_end_mask_0 = const()[name = tensor("op_6825_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6825_cast_fp16 = slice_by_index(begin = var_6825_begin_0, end = var_6825_end_0, end_mask = var_6825_end_mask_0, x = transpose_15)[name = tensor("op_6825_cast_fp16")]; + tensor var_6829_begin_0 = const()[name = tensor("op_6829_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_6829_end_0 = const()[name = tensor("op_6829_end_0"), val = tensor([2, 144, 1, 384])]; + tensor var_6829_end_mask_0 = const()[name = tensor("op_6829_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6829_cast_fp16 = slice_by_index(begin = var_6829_begin_0, end = var_6829_end_0, end_mask = var_6829_end_mask_0, x = transpose_15)[name = tensor("op_6829_cast_fp16")]; + tensor var_6833_begin_0 = const()[name = tensor("op_6833_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_6833_end_0 = const()[name = tensor("op_6833_end_0"), val = tensor([2, 144, 1, 448])]; + tensor var_6833_end_mask_0 = const()[name = tensor("op_6833_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6833_cast_fp16 = slice_by_index(begin = var_6833_begin_0, end = var_6833_end_0, end_mask = var_6833_end_mask_0, x = transpose_15)[name = tensor("op_6833_cast_fp16")]; + tensor var_6837_begin_0 = const()[name = tensor("op_6837_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_6837_end_0 = const()[name = tensor("op_6837_end_0"), val = tensor([2, 144, 1, 512])]; + tensor var_6837_end_mask_0 = const()[name = tensor("op_6837_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6837_cast_fp16 = slice_by_index(begin = var_6837_begin_0, end = var_6837_end_0, end_mask = var_6837_end_mask_0, x = transpose_15)[name = tensor("op_6837_cast_fp16")]; + tensor var_6841_begin_0 = const()[name = tensor("op_6841_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_6841_end_0 = const()[name = tensor("op_6841_end_0"), val = tensor([2, 144, 1, 576])]; + tensor var_6841_end_mask_0 = const()[name = tensor("op_6841_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6841_cast_fp16 = slice_by_index(begin = var_6841_begin_0, end = var_6841_end_0, end_mask = var_6841_end_mask_0, x = transpose_15)[name = tensor("op_6841_cast_fp16")]; + tensor var_6845_begin_0 = const()[name = tensor("op_6845_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_6845_end_0 = const()[name = tensor("op_6845_end_0"), val = tensor([2, 144, 1, 640])]; + tensor var_6845_end_mask_0 = const()[name = tensor("op_6845_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6845_cast_fp16 = slice_by_index(begin = var_6845_begin_0, end = var_6845_end_0, end_mask = var_6845_end_mask_0, x = transpose_15)[name = tensor("op_6845_cast_fp16")]; + tensor var_6849_begin_0 = const()[name = tensor("op_6849_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_6849_end_0 = const()[name = tensor("op_6849_end_0"), val = tensor([2, 144, 1, 704])]; + tensor var_6849_end_mask_0 = const()[name = tensor("op_6849_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6849_cast_fp16 = slice_by_index(begin = var_6849_begin_0, end = var_6849_end_0, end_mask = var_6849_end_mask_0, x = transpose_15)[name = tensor("op_6849_cast_fp16")]; + tensor var_6853_begin_0 = const()[name = tensor("op_6853_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_6853_end_0 = const()[name = tensor("op_6853_end_0"), val = tensor([2, 144, 1, 768])]; + tensor var_6853_end_mask_0 = const()[name = tensor("op_6853_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6853_cast_fp16 = slice_by_index(begin = var_6853_begin_0, end = var_6853_end_0, end_mask = var_6853_end_mask_0, x = transpose_15)[name = tensor("op_6853_cast_fp16")]; + tensor var_6857_begin_0 = const()[name = tensor("op_6857_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_6857_end_0 = const()[name = tensor("op_6857_end_0"), val = tensor([2, 144, 1, 832])]; + tensor var_6857_end_mask_0 = const()[name = tensor("op_6857_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6857_cast_fp16 = slice_by_index(begin = var_6857_begin_0, end = var_6857_end_0, end_mask = var_6857_end_mask_0, x = transpose_15)[name = tensor("op_6857_cast_fp16")]; + tensor var_6861_begin_0 = const()[name = tensor("op_6861_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_6861_end_0 = const()[name = tensor("op_6861_end_0"), val = tensor([2, 144, 1, 896])]; + tensor var_6861_end_mask_0 = const()[name = tensor("op_6861_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6861_cast_fp16 = slice_by_index(begin = var_6861_begin_0, end = var_6861_end_0, end_mask = var_6861_end_mask_0, x = transpose_15)[name = tensor("op_6861_cast_fp16")]; + tensor var_6865_begin_0 = const()[name = tensor("op_6865_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_6865_end_0 = const()[name = tensor("op_6865_end_0"), val = tensor([2, 144, 1, 960])]; + tensor var_6865_end_mask_0 = const()[name = tensor("op_6865_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6865_cast_fp16 = slice_by_index(begin = var_6865_begin_0, end = var_6865_end_0, end_mask = var_6865_end_mask_0, x = transpose_15)[name = tensor("op_6865_cast_fp16")]; + tensor var_6869_begin_0 = const()[name = tensor("op_6869_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_6869_end_0 = const()[name = tensor("op_6869_end_0"), val = tensor([2, 144, 1, 1024])]; + tensor var_6869_end_mask_0 = const()[name = tensor("op_6869_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6869_cast_fp16 = slice_by_index(begin = var_6869_begin_0, end = var_6869_end_0, end_mask = var_6869_end_mask_0, x = transpose_15)[name = tensor("op_6869_cast_fp16")]; + tensor var_6873_begin_0 = const()[name = tensor("op_6873_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_6873_end_0 = const()[name = tensor("op_6873_end_0"), val = tensor([2, 144, 1, 1088])]; + tensor var_6873_end_mask_0 = const()[name = tensor("op_6873_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6873_cast_fp16 = slice_by_index(begin = var_6873_begin_0, end = var_6873_end_0, end_mask = var_6873_end_mask_0, x = transpose_15)[name = tensor("op_6873_cast_fp16")]; + tensor var_6877_begin_0 = const()[name = tensor("op_6877_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_6877_end_0 = const()[name = tensor("op_6877_end_0"), val = tensor([2, 144, 1, 1152])]; + tensor var_6877_end_mask_0 = const()[name = tensor("op_6877_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6877_cast_fp16 = slice_by_index(begin = var_6877_begin_0, end = var_6877_end_0, end_mask = var_6877_end_mask_0, x = transpose_15)[name = tensor("op_6877_cast_fp16")]; + tensor var_6881_begin_0 = const()[name = tensor("op_6881_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_6881_end_0 = const()[name = tensor("op_6881_end_0"), val = tensor([2, 144, 1, 1216])]; + tensor var_6881_end_mask_0 = const()[name = tensor("op_6881_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6881_cast_fp16 = slice_by_index(begin = var_6881_begin_0, end = var_6881_end_0, end_mask = var_6881_end_mask_0, x = transpose_15)[name = tensor("op_6881_cast_fp16")]; + tensor var_6885_begin_0 = const()[name = tensor("op_6885_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_6885_end_0 = const()[name = tensor("op_6885_end_0"), val = tensor([2, 144, 1, 1280])]; + tensor var_6885_end_mask_0 = const()[name = tensor("op_6885_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_6885_cast_fp16 = slice_by_index(begin = var_6885_begin_0, end = var_6885_end_0, end_mask = var_6885_end_mask_0, x = transpose_15)[name = tensor("op_6885_cast_fp16")]; + tensor var_6887_begin_0 = const()[name = tensor("op_6887_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_6887_end_0 = const()[name = tensor("op_6887_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_6887_end_mask_0 = const()[name = tensor("op_6887_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6887_cast_fp16 = slice_by_index(begin = var_6887_begin_0, end = var_6887_end_0, end_mask = var_6887_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6887_cast_fp16")]; + tensor var_6891_begin_0 = const()[name = tensor("op_6891_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_6891_end_0 = const()[name = tensor("op_6891_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_6891_end_mask_0 = const()[name = tensor("op_6891_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6891_cast_fp16 = slice_by_index(begin = var_6891_begin_0, end = var_6891_end_0, end_mask = var_6891_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6891_cast_fp16")]; + tensor var_6895_begin_0 = const()[name = tensor("op_6895_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_6895_end_0 = const()[name = tensor("op_6895_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_6895_end_mask_0 = const()[name = tensor("op_6895_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6895_cast_fp16 = slice_by_index(begin = var_6895_begin_0, end = var_6895_end_0, end_mask = var_6895_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6895_cast_fp16")]; + tensor var_6899_begin_0 = const()[name = tensor("op_6899_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_6899_end_0 = const()[name = tensor("op_6899_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_6899_end_mask_0 = const()[name = tensor("op_6899_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6899_cast_fp16 = slice_by_index(begin = var_6899_begin_0, end = var_6899_end_0, end_mask = var_6899_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6899_cast_fp16")]; + tensor var_6903_begin_0 = const()[name = tensor("op_6903_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_6903_end_0 = const()[name = tensor("op_6903_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_6903_end_mask_0 = const()[name = tensor("op_6903_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6903_cast_fp16 = slice_by_index(begin = var_6903_begin_0, end = var_6903_end_0, end_mask = var_6903_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6903_cast_fp16")]; + tensor var_6907_begin_0 = const()[name = tensor("op_6907_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_6907_end_0 = const()[name = tensor("op_6907_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_6907_end_mask_0 = const()[name = tensor("op_6907_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6907_cast_fp16 = slice_by_index(begin = var_6907_begin_0, end = var_6907_end_0, end_mask = var_6907_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6907_cast_fp16")]; + tensor var_6911_begin_0 = const()[name = tensor("op_6911_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_6911_end_0 = const()[name = tensor("op_6911_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_6911_end_mask_0 = const()[name = tensor("op_6911_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6911_cast_fp16 = slice_by_index(begin = var_6911_begin_0, end = var_6911_end_0, end_mask = var_6911_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6911_cast_fp16")]; + tensor var_6915_begin_0 = const()[name = tensor("op_6915_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_6915_end_0 = const()[name = tensor("op_6915_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_6915_end_mask_0 = const()[name = tensor("op_6915_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6915_cast_fp16 = slice_by_index(begin = var_6915_begin_0, end = var_6915_end_0, end_mask = var_6915_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6915_cast_fp16")]; + tensor var_6919_begin_0 = const()[name = tensor("op_6919_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_6919_end_0 = const()[name = tensor("op_6919_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_6919_end_mask_0 = const()[name = tensor("op_6919_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6919_cast_fp16 = slice_by_index(begin = var_6919_begin_0, end = var_6919_end_0, end_mask = var_6919_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6919_cast_fp16")]; + tensor var_6923_begin_0 = const()[name = tensor("op_6923_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_6923_end_0 = const()[name = tensor("op_6923_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_6923_end_mask_0 = const()[name = tensor("op_6923_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6923_cast_fp16 = slice_by_index(begin = var_6923_begin_0, end = var_6923_end_0, end_mask = var_6923_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6923_cast_fp16")]; + tensor var_6927_begin_0 = const()[name = tensor("op_6927_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_6927_end_0 = const()[name = tensor("op_6927_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_6927_end_mask_0 = const()[name = tensor("op_6927_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6927_cast_fp16 = slice_by_index(begin = var_6927_begin_0, end = var_6927_end_0, end_mask = var_6927_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6927_cast_fp16")]; + tensor var_6931_begin_0 = const()[name = tensor("op_6931_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_6931_end_0 = const()[name = tensor("op_6931_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_6931_end_mask_0 = const()[name = tensor("op_6931_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6931_cast_fp16 = slice_by_index(begin = var_6931_begin_0, end = var_6931_end_0, end_mask = var_6931_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6931_cast_fp16")]; + tensor var_6935_begin_0 = const()[name = tensor("op_6935_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_6935_end_0 = const()[name = tensor("op_6935_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_6935_end_mask_0 = const()[name = tensor("op_6935_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6935_cast_fp16 = slice_by_index(begin = var_6935_begin_0, end = var_6935_end_0, end_mask = var_6935_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6935_cast_fp16")]; + tensor var_6939_begin_0 = const()[name = tensor("op_6939_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_6939_end_0 = const()[name = tensor("op_6939_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_6939_end_mask_0 = const()[name = tensor("op_6939_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6939_cast_fp16 = slice_by_index(begin = var_6939_begin_0, end = var_6939_end_0, end_mask = var_6939_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6939_cast_fp16")]; + tensor var_6943_begin_0 = const()[name = tensor("op_6943_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_6943_end_0 = const()[name = tensor("op_6943_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_6943_end_mask_0 = const()[name = tensor("op_6943_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6943_cast_fp16 = slice_by_index(begin = var_6943_begin_0, end = var_6943_end_0, end_mask = var_6943_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6943_cast_fp16")]; + tensor var_6947_begin_0 = const()[name = tensor("op_6947_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_6947_end_0 = const()[name = tensor("op_6947_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_6947_end_mask_0 = const()[name = tensor("op_6947_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6947_cast_fp16 = slice_by_index(begin = var_6947_begin_0, end = var_6947_end_0, end_mask = var_6947_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6947_cast_fp16")]; + tensor var_6951_begin_0 = const()[name = tensor("op_6951_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_6951_end_0 = const()[name = tensor("op_6951_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_6951_end_mask_0 = const()[name = tensor("op_6951_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6951_cast_fp16 = slice_by_index(begin = var_6951_begin_0, end = var_6951_end_0, end_mask = var_6951_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6951_cast_fp16")]; + tensor var_6955_begin_0 = const()[name = tensor("op_6955_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_6955_end_0 = const()[name = tensor("op_6955_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_6955_end_mask_0 = const()[name = tensor("op_6955_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6955_cast_fp16 = slice_by_index(begin = var_6955_begin_0, end = var_6955_end_0, end_mask = var_6955_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6955_cast_fp16")]; + tensor var_6959_begin_0 = const()[name = tensor("op_6959_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_6959_end_0 = const()[name = tensor("op_6959_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_6959_end_mask_0 = const()[name = tensor("op_6959_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6959_cast_fp16 = slice_by_index(begin = var_6959_begin_0, end = var_6959_end_0, end_mask = var_6959_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6959_cast_fp16")]; + tensor var_6963_begin_0 = const()[name = tensor("op_6963_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_6963_end_0 = const()[name = tensor("op_6963_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_6963_end_mask_0 = const()[name = tensor("op_6963_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_6963_cast_fp16 = slice_by_index(begin = var_6963_begin_0, end = var_6963_end_0, end_mask = var_6963_end_mask_0, x = v_33_cast_fp16)[name = tensor("op_6963_cast_fp16")]; + tensor var_6967_equation_0 = const()[name = tensor("op_6967_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6967_cast_fp16 = einsum(equation = var_6967_equation_0, values = (var_6809_cast_fp16, var_6726_cast_fp16))[name = tensor("op_6967_cast_fp16")]; + tensor var_6968_to_fp16 = const()[name = tensor("op_6968_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_441_cast_fp16 = mul(x = var_6967_cast_fp16, y = var_6968_to_fp16)[name = tensor("aw_441_cast_fp16")]; + tensor var_6971_equation_0 = const()[name = tensor("op_6971_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6971_cast_fp16 = einsum(equation = var_6971_equation_0, values = (var_6813_cast_fp16, var_6730_cast_fp16))[name = tensor("op_6971_cast_fp16")]; + tensor var_6972_to_fp16 = const()[name = tensor("op_6972_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_443_cast_fp16 = mul(x = var_6971_cast_fp16, y = var_6972_to_fp16)[name = tensor("aw_443_cast_fp16")]; + tensor var_6975_equation_0 = const()[name = tensor("op_6975_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6975_cast_fp16 = einsum(equation = var_6975_equation_0, values = (var_6817_cast_fp16, var_6734_cast_fp16))[name = tensor("op_6975_cast_fp16")]; + tensor var_6976_to_fp16 = const()[name = tensor("op_6976_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_445_cast_fp16 = mul(x = var_6975_cast_fp16, y = var_6976_to_fp16)[name = tensor("aw_445_cast_fp16")]; + tensor var_6979_equation_0 = const()[name = tensor("op_6979_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6979_cast_fp16 = einsum(equation = var_6979_equation_0, values = (var_6821_cast_fp16, var_6738_cast_fp16))[name = tensor("op_6979_cast_fp16")]; + tensor var_6980_to_fp16 = const()[name = tensor("op_6980_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_447_cast_fp16 = mul(x = var_6979_cast_fp16, y = var_6980_to_fp16)[name = tensor("aw_447_cast_fp16")]; + tensor var_6983_equation_0 = const()[name = tensor("op_6983_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6983_cast_fp16 = einsum(equation = var_6983_equation_0, values = (var_6825_cast_fp16, var_6742_cast_fp16))[name = tensor("op_6983_cast_fp16")]; + tensor var_6984_to_fp16 = const()[name = tensor("op_6984_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_449_cast_fp16 = mul(x = var_6983_cast_fp16, y = var_6984_to_fp16)[name = tensor("aw_449_cast_fp16")]; + tensor var_6987_equation_0 = const()[name = tensor("op_6987_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6987_cast_fp16 = einsum(equation = var_6987_equation_0, values = (var_6829_cast_fp16, var_6746_cast_fp16))[name = tensor("op_6987_cast_fp16")]; + tensor var_6988_to_fp16 = const()[name = tensor("op_6988_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_451_cast_fp16 = mul(x = var_6987_cast_fp16, y = var_6988_to_fp16)[name = tensor("aw_451_cast_fp16")]; + tensor var_6991_equation_0 = const()[name = tensor("op_6991_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6991_cast_fp16 = einsum(equation = var_6991_equation_0, values = (var_6833_cast_fp16, var_6750_cast_fp16))[name = tensor("op_6991_cast_fp16")]; + tensor var_6992_to_fp16 = const()[name = tensor("op_6992_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_453_cast_fp16 = mul(x = var_6991_cast_fp16, y = var_6992_to_fp16)[name = tensor("aw_453_cast_fp16")]; + tensor var_6995_equation_0 = const()[name = tensor("op_6995_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6995_cast_fp16 = einsum(equation = var_6995_equation_0, values = (var_6837_cast_fp16, var_6754_cast_fp16))[name = tensor("op_6995_cast_fp16")]; + tensor var_6996_to_fp16 = const()[name = tensor("op_6996_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_455_cast_fp16 = mul(x = var_6995_cast_fp16, y = var_6996_to_fp16)[name = tensor("aw_455_cast_fp16")]; + tensor var_6999_equation_0 = const()[name = tensor("op_6999_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_6999_cast_fp16 = einsum(equation = var_6999_equation_0, values = (var_6841_cast_fp16, var_6758_cast_fp16))[name = tensor("op_6999_cast_fp16")]; + tensor var_7000_to_fp16 = const()[name = tensor("op_7000_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_457_cast_fp16 = mul(x = var_6999_cast_fp16, y = var_7000_to_fp16)[name = tensor("aw_457_cast_fp16")]; + tensor var_7003_equation_0 = const()[name = tensor("op_7003_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7003_cast_fp16 = einsum(equation = var_7003_equation_0, values = (var_6845_cast_fp16, var_6762_cast_fp16))[name = tensor("op_7003_cast_fp16")]; + tensor var_7004_to_fp16 = const()[name = tensor("op_7004_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_459_cast_fp16 = mul(x = var_7003_cast_fp16, y = var_7004_to_fp16)[name = tensor("aw_459_cast_fp16")]; + tensor var_7007_equation_0 = const()[name = tensor("op_7007_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7007_cast_fp16 = einsum(equation = var_7007_equation_0, values = (var_6849_cast_fp16, var_6766_cast_fp16))[name = tensor("op_7007_cast_fp16")]; + tensor var_7008_to_fp16 = const()[name = tensor("op_7008_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_461_cast_fp16 = mul(x = var_7007_cast_fp16, y = var_7008_to_fp16)[name = tensor("aw_461_cast_fp16")]; + tensor var_7011_equation_0 = const()[name = tensor("op_7011_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7011_cast_fp16 = einsum(equation = var_7011_equation_0, values = (var_6853_cast_fp16, var_6770_cast_fp16))[name = tensor("op_7011_cast_fp16")]; + tensor var_7012_to_fp16 = const()[name = tensor("op_7012_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_463_cast_fp16 = mul(x = var_7011_cast_fp16, y = var_7012_to_fp16)[name = tensor("aw_463_cast_fp16")]; + tensor var_7015_equation_0 = const()[name = tensor("op_7015_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7015_cast_fp16 = einsum(equation = var_7015_equation_0, values = (var_6857_cast_fp16, var_6774_cast_fp16))[name = tensor("op_7015_cast_fp16")]; + tensor var_7016_to_fp16 = const()[name = tensor("op_7016_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_465_cast_fp16 = mul(x = var_7015_cast_fp16, y = var_7016_to_fp16)[name = tensor("aw_465_cast_fp16")]; + tensor var_7019_equation_0 = const()[name = tensor("op_7019_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7019_cast_fp16 = einsum(equation = var_7019_equation_0, values = (var_6861_cast_fp16, var_6778_cast_fp16))[name = tensor("op_7019_cast_fp16")]; + tensor var_7020_to_fp16 = const()[name = tensor("op_7020_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_467_cast_fp16 = mul(x = var_7019_cast_fp16, y = var_7020_to_fp16)[name = tensor("aw_467_cast_fp16")]; + tensor var_7023_equation_0 = const()[name = tensor("op_7023_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7023_cast_fp16 = einsum(equation = var_7023_equation_0, values = (var_6865_cast_fp16, var_6782_cast_fp16))[name = tensor("op_7023_cast_fp16")]; + tensor var_7024_to_fp16 = const()[name = tensor("op_7024_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_469_cast_fp16 = mul(x = var_7023_cast_fp16, y = var_7024_to_fp16)[name = tensor("aw_469_cast_fp16")]; + tensor var_7027_equation_0 = const()[name = tensor("op_7027_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7027_cast_fp16 = einsum(equation = var_7027_equation_0, values = (var_6869_cast_fp16, var_6786_cast_fp16))[name = tensor("op_7027_cast_fp16")]; + tensor var_7028_to_fp16 = const()[name = tensor("op_7028_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_471_cast_fp16 = mul(x = var_7027_cast_fp16, y = var_7028_to_fp16)[name = tensor("aw_471_cast_fp16")]; + tensor var_7031_equation_0 = const()[name = tensor("op_7031_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7031_cast_fp16 = einsum(equation = var_7031_equation_0, values = (var_6873_cast_fp16, var_6790_cast_fp16))[name = tensor("op_7031_cast_fp16")]; + tensor var_7032_to_fp16 = const()[name = tensor("op_7032_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_473_cast_fp16 = mul(x = var_7031_cast_fp16, y = var_7032_to_fp16)[name = tensor("aw_473_cast_fp16")]; + tensor var_7035_equation_0 = const()[name = tensor("op_7035_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7035_cast_fp16 = einsum(equation = var_7035_equation_0, values = (var_6877_cast_fp16, var_6794_cast_fp16))[name = tensor("op_7035_cast_fp16")]; + tensor var_7036_to_fp16 = const()[name = tensor("op_7036_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_475_cast_fp16 = mul(x = var_7035_cast_fp16, y = var_7036_to_fp16)[name = tensor("aw_475_cast_fp16")]; + tensor var_7039_equation_0 = const()[name = tensor("op_7039_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7039_cast_fp16 = einsum(equation = var_7039_equation_0, values = (var_6881_cast_fp16, var_6798_cast_fp16))[name = tensor("op_7039_cast_fp16")]; + tensor var_7040_to_fp16 = const()[name = tensor("op_7040_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_477_cast_fp16 = mul(x = var_7039_cast_fp16, y = var_7040_to_fp16)[name = tensor("aw_477_cast_fp16")]; + tensor var_7043_equation_0 = const()[name = tensor("op_7043_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7043_cast_fp16 = einsum(equation = var_7043_equation_0, values = (var_6885_cast_fp16, var_6802_cast_fp16))[name = tensor("op_7043_cast_fp16")]; + tensor var_7044_to_fp16 = const()[name = tensor("op_7044_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_479_cast_fp16 = mul(x = var_7043_cast_fp16, y = var_7044_to_fp16)[name = tensor("aw_479_cast_fp16")]; + tensor var_7046_cast_fp16 = softmax(axis = var_5599, x = aw_441_cast_fp16)[name = tensor("op_7046_cast_fp16")]; + tensor var_7047_cast_fp16 = softmax(axis = var_5599, x = aw_443_cast_fp16)[name = tensor("op_7047_cast_fp16")]; + tensor var_7048_cast_fp16 = softmax(axis = var_5599, x = aw_445_cast_fp16)[name = tensor("op_7048_cast_fp16")]; + tensor var_7049_cast_fp16 = softmax(axis = var_5599, x = aw_447_cast_fp16)[name = tensor("op_7049_cast_fp16")]; + tensor var_7050_cast_fp16 = softmax(axis = var_5599, x = aw_449_cast_fp16)[name = tensor("op_7050_cast_fp16")]; + tensor var_7051_cast_fp16 = softmax(axis = var_5599, x = aw_451_cast_fp16)[name = tensor("op_7051_cast_fp16")]; + tensor var_7052_cast_fp16 = softmax(axis = var_5599, x = aw_453_cast_fp16)[name = tensor("op_7052_cast_fp16")]; + tensor var_7053_cast_fp16 = softmax(axis = var_5599, x = aw_455_cast_fp16)[name = tensor("op_7053_cast_fp16")]; + tensor var_7054_cast_fp16 = softmax(axis = var_5599, x = aw_457_cast_fp16)[name = tensor("op_7054_cast_fp16")]; + tensor var_7055_cast_fp16 = softmax(axis = var_5599, x = aw_459_cast_fp16)[name = tensor("op_7055_cast_fp16")]; + tensor var_7056_cast_fp16 = softmax(axis = var_5599, x = aw_461_cast_fp16)[name = tensor("op_7056_cast_fp16")]; + tensor var_7057_cast_fp16 = softmax(axis = var_5599, x = aw_463_cast_fp16)[name = tensor("op_7057_cast_fp16")]; + tensor var_7058_cast_fp16 = softmax(axis = var_5599, x = aw_465_cast_fp16)[name = tensor("op_7058_cast_fp16")]; + tensor var_7059_cast_fp16 = softmax(axis = var_5599, x = aw_467_cast_fp16)[name = tensor("op_7059_cast_fp16")]; + tensor var_7060_cast_fp16 = softmax(axis = var_5599, x = aw_469_cast_fp16)[name = tensor("op_7060_cast_fp16")]; + tensor var_7061_cast_fp16 = softmax(axis = var_5599, x = aw_471_cast_fp16)[name = tensor("op_7061_cast_fp16")]; + tensor var_7062_cast_fp16 = softmax(axis = var_5599, x = aw_473_cast_fp16)[name = tensor("op_7062_cast_fp16")]; + tensor var_7063_cast_fp16 = softmax(axis = var_5599, x = aw_475_cast_fp16)[name = tensor("op_7063_cast_fp16")]; + tensor var_7064_cast_fp16 = softmax(axis = var_5599, x = aw_477_cast_fp16)[name = tensor("op_7064_cast_fp16")]; + tensor var_7065_cast_fp16 = softmax(axis = var_5599, x = aw_479_cast_fp16)[name = tensor("op_7065_cast_fp16")]; + tensor var_7067_equation_0 = const()[name = tensor("op_7067_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7067_cast_fp16 = einsum(equation = var_7067_equation_0, values = (var_6887_cast_fp16, var_7046_cast_fp16))[name = tensor("op_7067_cast_fp16")]; + tensor var_7069_equation_0 = const()[name = tensor("op_7069_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7069_cast_fp16 = einsum(equation = var_7069_equation_0, values = (var_6891_cast_fp16, var_7047_cast_fp16))[name = tensor("op_7069_cast_fp16")]; + tensor var_7071_equation_0 = const()[name = tensor("op_7071_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7071_cast_fp16 = einsum(equation = var_7071_equation_0, values = (var_6895_cast_fp16, var_7048_cast_fp16))[name = tensor("op_7071_cast_fp16")]; + tensor var_7073_equation_0 = const()[name = tensor("op_7073_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7073_cast_fp16 = einsum(equation = var_7073_equation_0, values = (var_6899_cast_fp16, var_7049_cast_fp16))[name = tensor("op_7073_cast_fp16")]; + tensor var_7075_equation_0 = const()[name = tensor("op_7075_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7075_cast_fp16 = einsum(equation = var_7075_equation_0, values = (var_6903_cast_fp16, var_7050_cast_fp16))[name = tensor("op_7075_cast_fp16")]; + tensor var_7077_equation_0 = const()[name = tensor("op_7077_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7077_cast_fp16 = einsum(equation = var_7077_equation_0, values = (var_6907_cast_fp16, var_7051_cast_fp16))[name = tensor("op_7077_cast_fp16")]; + tensor var_7079_equation_0 = const()[name = tensor("op_7079_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7079_cast_fp16 = einsum(equation = var_7079_equation_0, values = (var_6911_cast_fp16, var_7052_cast_fp16))[name = tensor("op_7079_cast_fp16")]; + tensor var_7081_equation_0 = const()[name = tensor("op_7081_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7081_cast_fp16 = einsum(equation = var_7081_equation_0, values = (var_6915_cast_fp16, var_7053_cast_fp16))[name = tensor("op_7081_cast_fp16")]; + tensor var_7083_equation_0 = const()[name = tensor("op_7083_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7083_cast_fp16 = einsum(equation = var_7083_equation_0, values = (var_6919_cast_fp16, var_7054_cast_fp16))[name = tensor("op_7083_cast_fp16")]; + tensor var_7085_equation_0 = const()[name = tensor("op_7085_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7085_cast_fp16 = einsum(equation = var_7085_equation_0, values = (var_6923_cast_fp16, var_7055_cast_fp16))[name = tensor("op_7085_cast_fp16")]; + tensor var_7087_equation_0 = const()[name = tensor("op_7087_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7087_cast_fp16 = einsum(equation = var_7087_equation_0, values = (var_6927_cast_fp16, var_7056_cast_fp16))[name = tensor("op_7087_cast_fp16")]; + tensor var_7089_equation_0 = const()[name = tensor("op_7089_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7089_cast_fp16 = einsum(equation = var_7089_equation_0, values = (var_6931_cast_fp16, var_7057_cast_fp16))[name = tensor("op_7089_cast_fp16")]; + tensor var_7091_equation_0 = const()[name = tensor("op_7091_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7091_cast_fp16 = einsum(equation = var_7091_equation_0, values = (var_6935_cast_fp16, var_7058_cast_fp16))[name = tensor("op_7091_cast_fp16")]; + tensor var_7093_equation_0 = const()[name = tensor("op_7093_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7093_cast_fp16 = einsum(equation = var_7093_equation_0, values = (var_6939_cast_fp16, var_7059_cast_fp16))[name = tensor("op_7093_cast_fp16")]; + tensor var_7095_equation_0 = const()[name = tensor("op_7095_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7095_cast_fp16 = einsum(equation = var_7095_equation_0, values = (var_6943_cast_fp16, var_7060_cast_fp16))[name = tensor("op_7095_cast_fp16")]; + tensor var_7097_equation_0 = const()[name = tensor("op_7097_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7097_cast_fp16 = einsum(equation = var_7097_equation_0, values = (var_6947_cast_fp16, var_7061_cast_fp16))[name = tensor("op_7097_cast_fp16")]; + tensor var_7099_equation_0 = const()[name = tensor("op_7099_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7099_cast_fp16 = einsum(equation = var_7099_equation_0, values = (var_6951_cast_fp16, var_7062_cast_fp16))[name = tensor("op_7099_cast_fp16")]; + tensor var_7101_equation_0 = const()[name = tensor("op_7101_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7101_cast_fp16 = einsum(equation = var_7101_equation_0, values = (var_6955_cast_fp16, var_7063_cast_fp16))[name = tensor("op_7101_cast_fp16")]; + tensor var_7103_equation_0 = const()[name = tensor("op_7103_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7103_cast_fp16 = einsum(equation = var_7103_equation_0, values = (var_6959_cast_fp16, var_7064_cast_fp16))[name = tensor("op_7103_cast_fp16")]; + tensor var_7105_equation_0 = const()[name = tensor("op_7105_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7105_cast_fp16 = einsum(equation = var_7105_equation_0, values = (var_6963_cast_fp16, var_7065_cast_fp16))[name = tensor("op_7105_cast_fp16")]; + tensor input_327_interleave_0 = const()[name = tensor("input_327_interleave_0"), val = tensor(false)]; + tensor input_327_cast_fp16 = concat(axis = var_5599, interleave = input_327_interleave_0, values = (var_7067_cast_fp16, var_7069_cast_fp16, var_7071_cast_fp16, var_7073_cast_fp16, var_7075_cast_fp16, var_7077_cast_fp16, var_7079_cast_fp16, var_7081_cast_fp16, var_7083_cast_fp16, var_7085_cast_fp16, var_7087_cast_fp16, var_7089_cast_fp16, var_7091_cast_fp16, var_7093_cast_fp16, var_7095_cast_fp16, var_7097_cast_fp16, var_7099_cast_fp16, var_7101_cast_fp16, var_7103_cast_fp16, var_7105_cast_fp16))[name = tensor("input_327_cast_fp16")]; + tensor var_7111 = const()[name = tensor("op_7111"), val = tensor([1, 1])]; + tensor var_7113 = const()[name = tensor("op_7113"), val = tensor([1, 1])]; + tensor var_7115_pad_type_0 = const()[name = tensor("op_7115_pad_type_0"), val = tensor("custom")]; + tensor var_7115_pad_0 = const()[name = tensor("op_7115_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1308464000)))]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1311740864)))]; + tensor var_7115_cast_fp16 = conv(bias = up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_7113, groups = var_5599, pad = var_7115_pad_0, pad_type = var_7115_pad_type_0, strides = var_7111, weight = up_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_327_cast_fp16)[name = tensor("op_7115_cast_fp16")]; + tensor inputs_51_cast_fp16 = add(x = var_7115_cast_fp16, y = inputs_49_cast_fp16)[name = tensor("inputs_51_cast_fp16")]; + tensor var_7119 = const()[name = tensor("op_7119"), val = tensor([1])]; + tensor channels_mean_51_cast_fp16 = reduce_mean(axes = var_7119, keep_dims = var_5594, x = inputs_51_cast_fp16)[name = tensor("channels_mean_51_cast_fp16")]; + tensor zero_mean_51_cast_fp16 = sub(x = inputs_51_cast_fp16, y = channels_mean_51_cast_fp16)[name = tensor("zero_mean_51_cast_fp16")]; + tensor zero_mean_sq_51_cast_fp16 = mul(x = zero_mean_51_cast_fp16, y = zero_mean_51_cast_fp16)[name = tensor("zero_mean_sq_51_cast_fp16")]; + tensor var_7123 = const()[name = tensor("op_7123"), val = tensor([1])]; + tensor var_7124_cast_fp16 = reduce_mean(axes = var_7123, keep_dims = var_5594, x = zero_mean_sq_51_cast_fp16)[name = tensor("op_7124_cast_fp16")]; + tensor var_7125_to_fp16 = const()[name = tensor("op_7125_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_7126_cast_fp16 = add(x = var_7124_cast_fp16, y = var_7125_to_fp16)[name = tensor("op_7126_cast_fp16")]; + tensor denom_51_epsilon_0_to_fp16 = const()[name = tensor("denom_51_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_51_cast_fp16 = rsqrt(epsilon = denom_51_epsilon_0_to_fp16, x = var_7126_cast_fp16)[name = tensor("denom_51_cast_fp16")]; + tensor out_51_cast_fp16 = mul(x = zero_mean_51_cast_fp16, y = denom_51_cast_fp16)[name = tensor("out_51_cast_fp16")]; + tensor var_7130_to_fp16 = const()[name = tensor("op_7130_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1311743488)))]; + tensor var_7131_cast_fp16 = add(x = out_51_cast_fp16, y = var_7130_to_fp16)[name = tensor("op_7131_cast_fp16")]; + tensor var_7133_to_fp16 = const()[name = tensor("op_7133_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1311746112)))]; + tensor hidden_states_189_cast_fp16 = mul(x = var_7131_cast_fp16, y = var_7133_to_fp16)[name = tensor("hidden_states_189_cast_fp16")]; + tensor var_7140 = const()[name = tensor("op_7140"), val = tensor([1, 1])]; + tensor var_7142 = const()[name = tensor("op_7142"), val = tensor([1, 1])]; + tensor q_35_pad_type_0 = const()[name = tensor("q_35_pad_type_0"), val = tensor("custom")]; + tensor q_35_pad_0 = const()[name = tensor("q_35_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1311748736)))]; + tensor q_35_cast_fp16 = conv(dilations = var_7142, groups = var_5599, pad = q_35_pad_0, pad_type = q_35_pad_type_0, strides = var_7140, weight = up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_189_cast_fp16)[name = tensor("q_35_cast_fp16")]; + tensor var_7146 = const()[name = tensor("op_7146"), val = tensor([1, 1])]; + tensor var_7148 = const()[name = tensor("op_7148"), val = tensor([1, 1])]; + tensor k_69_pad_type_0 = const()[name = tensor("k_69_pad_type_0"), val = tensor("custom")]; + tensor k_69_pad_0 = const()[name = tensor("k_69_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1315025600)))]; + tensor k_69_cast_fp16 = conv(dilations = var_7148, groups = var_5599, pad = k_69_pad_0, pad_type = k_69_pad_type_0, strides = var_7146, weight = up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_69_cast_fp16")]; + tensor var_7152 = const()[name = tensor("op_7152"), val = tensor([1, 1])]; + tensor var_7154 = const()[name = tensor("op_7154"), val = tensor([1, 1])]; + tensor v_35_pad_type_0 = const()[name = tensor("v_35_pad_type_0"), val = tensor("custom")]; + tensor v_35_pad_0 = const()[name = tensor("v_35_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1317647104)))]; + tensor v_35_cast_fp16 = conv(dilations = var_7154, groups = var_5599, pad = v_35_pad_0, pad_type = v_35_pad_type_0, strides = var_7152, weight = up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_35_cast_fp16")]; + tensor var_7158_begin_0 = const()[name = tensor("op_7158_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_7158_end_0 = const()[name = tensor("op_7158_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_7158_end_mask_0 = const()[name = tensor("op_7158_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7158_cast_fp16 = slice_by_index(begin = var_7158_begin_0, end = var_7158_end_0, end_mask = var_7158_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7158_cast_fp16")]; + tensor var_7162_begin_0 = const()[name = tensor("op_7162_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_7162_end_0 = const()[name = tensor("op_7162_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_7162_end_mask_0 = const()[name = tensor("op_7162_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7162_cast_fp16 = slice_by_index(begin = var_7162_begin_0, end = var_7162_end_0, end_mask = var_7162_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7162_cast_fp16")]; + tensor var_7166_begin_0 = const()[name = tensor("op_7166_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_7166_end_0 = const()[name = tensor("op_7166_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_7166_end_mask_0 = const()[name = tensor("op_7166_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7166_cast_fp16 = slice_by_index(begin = var_7166_begin_0, end = var_7166_end_0, end_mask = var_7166_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7166_cast_fp16")]; + tensor var_7170_begin_0 = const()[name = tensor("op_7170_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_7170_end_0 = const()[name = tensor("op_7170_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_7170_end_mask_0 = const()[name = tensor("op_7170_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7170_cast_fp16 = slice_by_index(begin = var_7170_begin_0, end = var_7170_end_0, end_mask = var_7170_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7170_cast_fp16")]; + tensor var_7174_begin_0 = const()[name = tensor("op_7174_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_7174_end_0 = const()[name = tensor("op_7174_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_7174_end_mask_0 = const()[name = tensor("op_7174_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7174_cast_fp16 = slice_by_index(begin = var_7174_begin_0, end = var_7174_end_0, end_mask = var_7174_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7174_cast_fp16")]; + tensor var_7178_begin_0 = const()[name = tensor("op_7178_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_7178_end_0 = const()[name = tensor("op_7178_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_7178_end_mask_0 = const()[name = tensor("op_7178_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7178_cast_fp16 = slice_by_index(begin = var_7178_begin_0, end = var_7178_end_0, end_mask = var_7178_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7178_cast_fp16")]; + tensor var_7182_begin_0 = const()[name = tensor("op_7182_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_7182_end_0 = const()[name = tensor("op_7182_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_7182_end_mask_0 = const()[name = tensor("op_7182_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7182_cast_fp16 = slice_by_index(begin = var_7182_begin_0, end = var_7182_end_0, end_mask = var_7182_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7182_cast_fp16")]; + tensor var_7186_begin_0 = const()[name = tensor("op_7186_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_7186_end_0 = const()[name = tensor("op_7186_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_7186_end_mask_0 = const()[name = tensor("op_7186_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7186_cast_fp16 = slice_by_index(begin = var_7186_begin_0, end = var_7186_end_0, end_mask = var_7186_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7186_cast_fp16")]; + tensor var_7190_begin_0 = const()[name = tensor("op_7190_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_7190_end_0 = const()[name = tensor("op_7190_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_7190_end_mask_0 = const()[name = tensor("op_7190_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7190_cast_fp16 = slice_by_index(begin = var_7190_begin_0, end = var_7190_end_0, end_mask = var_7190_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7190_cast_fp16")]; + tensor var_7194_begin_0 = const()[name = tensor("op_7194_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_7194_end_0 = const()[name = tensor("op_7194_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_7194_end_mask_0 = const()[name = tensor("op_7194_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7194_cast_fp16 = slice_by_index(begin = var_7194_begin_0, end = var_7194_end_0, end_mask = var_7194_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7194_cast_fp16")]; + tensor var_7198_begin_0 = const()[name = tensor("op_7198_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_7198_end_0 = const()[name = tensor("op_7198_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_7198_end_mask_0 = const()[name = tensor("op_7198_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7198_cast_fp16 = slice_by_index(begin = var_7198_begin_0, end = var_7198_end_0, end_mask = var_7198_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7198_cast_fp16")]; + tensor var_7202_begin_0 = const()[name = tensor("op_7202_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_7202_end_0 = const()[name = tensor("op_7202_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_7202_end_mask_0 = const()[name = tensor("op_7202_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7202_cast_fp16 = slice_by_index(begin = var_7202_begin_0, end = var_7202_end_0, end_mask = var_7202_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7202_cast_fp16")]; + tensor var_7206_begin_0 = const()[name = tensor("op_7206_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_7206_end_0 = const()[name = tensor("op_7206_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_7206_end_mask_0 = const()[name = tensor("op_7206_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7206_cast_fp16 = slice_by_index(begin = var_7206_begin_0, end = var_7206_end_0, end_mask = var_7206_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7206_cast_fp16")]; + tensor var_7210_begin_0 = const()[name = tensor("op_7210_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_7210_end_0 = const()[name = tensor("op_7210_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_7210_end_mask_0 = const()[name = tensor("op_7210_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7210_cast_fp16 = slice_by_index(begin = var_7210_begin_0, end = var_7210_end_0, end_mask = var_7210_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7210_cast_fp16")]; + tensor var_7214_begin_0 = const()[name = tensor("op_7214_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_7214_end_0 = const()[name = tensor("op_7214_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_7214_end_mask_0 = const()[name = tensor("op_7214_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7214_cast_fp16 = slice_by_index(begin = var_7214_begin_0, end = var_7214_end_0, end_mask = var_7214_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7214_cast_fp16")]; + tensor var_7218_begin_0 = const()[name = tensor("op_7218_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_7218_end_0 = const()[name = tensor("op_7218_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_7218_end_mask_0 = const()[name = tensor("op_7218_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7218_cast_fp16 = slice_by_index(begin = var_7218_begin_0, end = var_7218_end_0, end_mask = var_7218_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7218_cast_fp16")]; + tensor var_7222_begin_0 = const()[name = tensor("op_7222_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_7222_end_0 = const()[name = tensor("op_7222_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_7222_end_mask_0 = const()[name = tensor("op_7222_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7222_cast_fp16 = slice_by_index(begin = var_7222_begin_0, end = var_7222_end_0, end_mask = var_7222_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7222_cast_fp16")]; + tensor var_7226_begin_0 = const()[name = tensor("op_7226_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_7226_end_0 = const()[name = tensor("op_7226_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_7226_end_mask_0 = const()[name = tensor("op_7226_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7226_cast_fp16 = slice_by_index(begin = var_7226_begin_0, end = var_7226_end_0, end_mask = var_7226_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7226_cast_fp16")]; + tensor var_7230_begin_0 = const()[name = tensor("op_7230_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_7230_end_0 = const()[name = tensor("op_7230_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_7230_end_mask_0 = const()[name = tensor("op_7230_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7230_cast_fp16 = slice_by_index(begin = var_7230_begin_0, end = var_7230_end_0, end_mask = var_7230_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7230_cast_fp16")]; + tensor var_7234_begin_0 = const()[name = tensor("op_7234_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_7234_end_0 = const()[name = tensor("op_7234_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_7234_end_mask_0 = const()[name = tensor("op_7234_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7234_cast_fp16 = slice_by_index(begin = var_7234_begin_0, end = var_7234_end_0, end_mask = var_7234_end_mask_0, x = q_35_cast_fp16)[name = tensor("op_7234_cast_fp16")]; + tensor k_71_perm_0 = const()[name = tensor("k_71_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_7241_begin_0 = const()[name = tensor("op_7241_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_7241_end_0 = const()[name = tensor("op_7241_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_7241_end_mask_0 = const()[name = tensor("op_7241_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_14 = transpose(perm = k_71_perm_0, x = k_69_cast_fp16)[name = tensor("transpose_14")]; + tensor var_7241_cast_fp16 = slice_by_index(begin = var_7241_begin_0, end = var_7241_end_0, end_mask = var_7241_end_mask_0, x = transpose_14)[name = tensor("op_7241_cast_fp16")]; + tensor var_7245_begin_0 = const()[name = tensor("op_7245_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_7245_end_0 = const()[name = tensor("op_7245_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_7245_end_mask_0 = const()[name = tensor("op_7245_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7245_cast_fp16 = slice_by_index(begin = var_7245_begin_0, end = var_7245_end_0, end_mask = var_7245_end_mask_0, x = transpose_14)[name = tensor("op_7245_cast_fp16")]; + tensor var_7249_begin_0 = const()[name = tensor("op_7249_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_7249_end_0 = const()[name = tensor("op_7249_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_7249_end_mask_0 = const()[name = tensor("op_7249_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7249_cast_fp16 = slice_by_index(begin = var_7249_begin_0, end = var_7249_end_0, end_mask = var_7249_end_mask_0, x = transpose_14)[name = tensor("op_7249_cast_fp16")]; + tensor var_7253_begin_0 = const()[name = tensor("op_7253_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_7253_end_0 = const()[name = tensor("op_7253_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_7253_end_mask_0 = const()[name = tensor("op_7253_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7253_cast_fp16 = slice_by_index(begin = var_7253_begin_0, end = var_7253_end_0, end_mask = var_7253_end_mask_0, x = transpose_14)[name = tensor("op_7253_cast_fp16")]; + tensor var_7257_begin_0 = const()[name = tensor("op_7257_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_7257_end_0 = const()[name = tensor("op_7257_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_7257_end_mask_0 = const()[name = tensor("op_7257_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7257_cast_fp16 = slice_by_index(begin = var_7257_begin_0, end = var_7257_end_0, end_mask = var_7257_end_mask_0, x = transpose_14)[name = tensor("op_7257_cast_fp16")]; + tensor var_7261_begin_0 = const()[name = tensor("op_7261_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_7261_end_0 = const()[name = tensor("op_7261_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_7261_end_mask_0 = const()[name = tensor("op_7261_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7261_cast_fp16 = slice_by_index(begin = var_7261_begin_0, end = var_7261_end_0, end_mask = var_7261_end_mask_0, x = transpose_14)[name = tensor("op_7261_cast_fp16")]; + tensor var_7265_begin_0 = const()[name = tensor("op_7265_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_7265_end_0 = const()[name = tensor("op_7265_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_7265_end_mask_0 = const()[name = tensor("op_7265_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7265_cast_fp16 = slice_by_index(begin = var_7265_begin_0, end = var_7265_end_0, end_mask = var_7265_end_mask_0, x = transpose_14)[name = tensor("op_7265_cast_fp16")]; + tensor var_7269_begin_0 = const()[name = tensor("op_7269_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_7269_end_0 = const()[name = tensor("op_7269_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_7269_end_mask_0 = const()[name = tensor("op_7269_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7269_cast_fp16 = slice_by_index(begin = var_7269_begin_0, end = var_7269_end_0, end_mask = var_7269_end_mask_0, x = transpose_14)[name = tensor("op_7269_cast_fp16")]; + tensor var_7273_begin_0 = const()[name = tensor("op_7273_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_7273_end_0 = const()[name = tensor("op_7273_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_7273_end_mask_0 = const()[name = tensor("op_7273_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7273_cast_fp16 = slice_by_index(begin = var_7273_begin_0, end = var_7273_end_0, end_mask = var_7273_end_mask_0, x = transpose_14)[name = tensor("op_7273_cast_fp16")]; + tensor var_7277_begin_0 = const()[name = tensor("op_7277_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_7277_end_0 = const()[name = tensor("op_7277_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_7277_end_mask_0 = const()[name = tensor("op_7277_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7277_cast_fp16 = slice_by_index(begin = var_7277_begin_0, end = var_7277_end_0, end_mask = var_7277_end_mask_0, x = transpose_14)[name = tensor("op_7277_cast_fp16")]; + tensor var_7281_begin_0 = const()[name = tensor("op_7281_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_7281_end_0 = const()[name = tensor("op_7281_end_0"), val = tensor([2, 77, 1, 704])]; + tensor var_7281_end_mask_0 = const()[name = tensor("op_7281_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7281_cast_fp16 = slice_by_index(begin = var_7281_begin_0, end = var_7281_end_0, end_mask = var_7281_end_mask_0, x = transpose_14)[name = tensor("op_7281_cast_fp16")]; + tensor var_7285_begin_0 = const()[name = tensor("op_7285_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_7285_end_0 = const()[name = tensor("op_7285_end_0"), val = tensor([2, 77, 1, 768])]; + tensor var_7285_end_mask_0 = const()[name = tensor("op_7285_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7285_cast_fp16 = slice_by_index(begin = var_7285_begin_0, end = var_7285_end_0, end_mask = var_7285_end_mask_0, x = transpose_14)[name = tensor("op_7285_cast_fp16")]; + tensor var_7289_begin_0 = const()[name = tensor("op_7289_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_7289_end_0 = const()[name = tensor("op_7289_end_0"), val = tensor([2, 77, 1, 832])]; + tensor var_7289_end_mask_0 = const()[name = tensor("op_7289_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7289_cast_fp16 = slice_by_index(begin = var_7289_begin_0, end = var_7289_end_0, end_mask = var_7289_end_mask_0, x = transpose_14)[name = tensor("op_7289_cast_fp16")]; + tensor var_7293_begin_0 = const()[name = tensor("op_7293_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_7293_end_0 = const()[name = tensor("op_7293_end_0"), val = tensor([2, 77, 1, 896])]; + tensor var_7293_end_mask_0 = const()[name = tensor("op_7293_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7293_cast_fp16 = slice_by_index(begin = var_7293_begin_0, end = var_7293_end_0, end_mask = var_7293_end_mask_0, x = transpose_14)[name = tensor("op_7293_cast_fp16")]; + tensor var_7297_begin_0 = const()[name = tensor("op_7297_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_7297_end_0 = const()[name = tensor("op_7297_end_0"), val = tensor([2, 77, 1, 960])]; + tensor var_7297_end_mask_0 = const()[name = tensor("op_7297_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7297_cast_fp16 = slice_by_index(begin = var_7297_begin_0, end = var_7297_end_0, end_mask = var_7297_end_mask_0, x = transpose_14)[name = tensor("op_7297_cast_fp16")]; + tensor var_7301_begin_0 = const()[name = tensor("op_7301_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_7301_end_0 = const()[name = tensor("op_7301_end_0"), val = tensor([2, 77, 1, 1024])]; + tensor var_7301_end_mask_0 = const()[name = tensor("op_7301_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7301_cast_fp16 = slice_by_index(begin = var_7301_begin_0, end = var_7301_end_0, end_mask = var_7301_end_mask_0, x = transpose_14)[name = tensor("op_7301_cast_fp16")]; + tensor var_7305_begin_0 = const()[name = tensor("op_7305_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_7305_end_0 = const()[name = tensor("op_7305_end_0"), val = tensor([2, 77, 1, 1088])]; + tensor var_7305_end_mask_0 = const()[name = tensor("op_7305_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7305_cast_fp16 = slice_by_index(begin = var_7305_begin_0, end = var_7305_end_0, end_mask = var_7305_end_mask_0, x = transpose_14)[name = tensor("op_7305_cast_fp16")]; + tensor var_7309_begin_0 = const()[name = tensor("op_7309_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_7309_end_0 = const()[name = tensor("op_7309_end_0"), val = tensor([2, 77, 1, 1152])]; + tensor var_7309_end_mask_0 = const()[name = tensor("op_7309_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7309_cast_fp16 = slice_by_index(begin = var_7309_begin_0, end = var_7309_end_0, end_mask = var_7309_end_mask_0, x = transpose_14)[name = tensor("op_7309_cast_fp16")]; + tensor var_7313_begin_0 = const()[name = tensor("op_7313_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_7313_end_0 = const()[name = tensor("op_7313_end_0"), val = tensor([2, 77, 1, 1216])]; + tensor var_7313_end_mask_0 = const()[name = tensor("op_7313_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7313_cast_fp16 = slice_by_index(begin = var_7313_begin_0, end = var_7313_end_0, end_mask = var_7313_end_mask_0, x = transpose_14)[name = tensor("op_7313_cast_fp16")]; + tensor var_7317_begin_0 = const()[name = tensor("op_7317_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_7317_end_0 = const()[name = tensor("op_7317_end_0"), val = tensor([2, 77, 1, 1280])]; + tensor var_7317_end_mask_0 = const()[name = tensor("op_7317_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7317_cast_fp16 = slice_by_index(begin = var_7317_begin_0, end = var_7317_end_0, end_mask = var_7317_end_mask_0, x = transpose_14)[name = tensor("op_7317_cast_fp16")]; + tensor var_7319_begin_0 = const()[name = tensor("op_7319_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_7319_end_0 = const()[name = tensor("op_7319_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_7319_end_mask_0 = const()[name = tensor("op_7319_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7319_cast_fp16 = slice_by_index(begin = var_7319_begin_0, end = var_7319_end_0, end_mask = var_7319_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7319_cast_fp16")]; + tensor var_7323_begin_0 = const()[name = tensor("op_7323_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_7323_end_0 = const()[name = tensor("op_7323_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_7323_end_mask_0 = const()[name = tensor("op_7323_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7323_cast_fp16 = slice_by_index(begin = var_7323_begin_0, end = var_7323_end_0, end_mask = var_7323_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7323_cast_fp16")]; + tensor var_7327_begin_0 = const()[name = tensor("op_7327_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_7327_end_0 = const()[name = tensor("op_7327_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_7327_end_mask_0 = const()[name = tensor("op_7327_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7327_cast_fp16 = slice_by_index(begin = var_7327_begin_0, end = var_7327_end_0, end_mask = var_7327_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7327_cast_fp16")]; + tensor var_7331_begin_0 = const()[name = tensor("op_7331_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_7331_end_0 = const()[name = tensor("op_7331_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_7331_end_mask_0 = const()[name = tensor("op_7331_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7331_cast_fp16 = slice_by_index(begin = var_7331_begin_0, end = var_7331_end_0, end_mask = var_7331_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7331_cast_fp16")]; + tensor var_7335_begin_0 = const()[name = tensor("op_7335_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_7335_end_0 = const()[name = tensor("op_7335_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_7335_end_mask_0 = const()[name = tensor("op_7335_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7335_cast_fp16 = slice_by_index(begin = var_7335_begin_0, end = var_7335_end_0, end_mask = var_7335_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7335_cast_fp16")]; + tensor var_7339_begin_0 = const()[name = tensor("op_7339_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_7339_end_0 = const()[name = tensor("op_7339_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_7339_end_mask_0 = const()[name = tensor("op_7339_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7339_cast_fp16 = slice_by_index(begin = var_7339_begin_0, end = var_7339_end_0, end_mask = var_7339_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7339_cast_fp16")]; + tensor var_7343_begin_0 = const()[name = tensor("op_7343_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_7343_end_0 = const()[name = tensor("op_7343_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_7343_end_mask_0 = const()[name = tensor("op_7343_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7343_cast_fp16 = slice_by_index(begin = var_7343_begin_0, end = var_7343_end_0, end_mask = var_7343_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7343_cast_fp16")]; + tensor var_7347_begin_0 = const()[name = tensor("op_7347_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_7347_end_0 = const()[name = tensor("op_7347_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_7347_end_mask_0 = const()[name = tensor("op_7347_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7347_cast_fp16 = slice_by_index(begin = var_7347_begin_0, end = var_7347_end_0, end_mask = var_7347_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7347_cast_fp16")]; + tensor var_7351_begin_0 = const()[name = tensor("op_7351_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_7351_end_0 = const()[name = tensor("op_7351_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_7351_end_mask_0 = const()[name = tensor("op_7351_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7351_cast_fp16 = slice_by_index(begin = var_7351_begin_0, end = var_7351_end_0, end_mask = var_7351_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7351_cast_fp16")]; + tensor var_7355_begin_0 = const()[name = tensor("op_7355_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_7355_end_0 = const()[name = tensor("op_7355_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_7355_end_mask_0 = const()[name = tensor("op_7355_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7355_cast_fp16 = slice_by_index(begin = var_7355_begin_0, end = var_7355_end_0, end_mask = var_7355_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7355_cast_fp16")]; + tensor var_7359_begin_0 = const()[name = tensor("op_7359_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_7359_end_0 = const()[name = tensor("op_7359_end_0"), val = tensor([2, 704, 1, 77])]; + tensor var_7359_end_mask_0 = const()[name = tensor("op_7359_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7359_cast_fp16 = slice_by_index(begin = var_7359_begin_0, end = var_7359_end_0, end_mask = var_7359_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7359_cast_fp16")]; + tensor var_7363_begin_0 = const()[name = tensor("op_7363_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_7363_end_0 = const()[name = tensor("op_7363_end_0"), val = tensor([2, 768, 1, 77])]; + tensor var_7363_end_mask_0 = const()[name = tensor("op_7363_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7363_cast_fp16 = slice_by_index(begin = var_7363_begin_0, end = var_7363_end_0, end_mask = var_7363_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7363_cast_fp16")]; + tensor var_7367_begin_0 = const()[name = tensor("op_7367_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_7367_end_0 = const()[name = tensor("op_7367_end_0"), val = tensor([2, 832, 1, 77])]; + tensor var_7367_end_mask_0 = const()[name = tensor("op_7367_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7367_cast_fp16 = slice_by_index(begin = var_7367_begin_0, end = var_7367_end_0, end_mask = var_7367_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7367_cast_fp16")]; + tensor var_7371_begin_0 = const()[name = tensor("op_7371_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_7371_end_0 = const()[name = tensor("op_7371_end_0"), val = tensor([2, 896, 1, 77])]; + tensor var_7371_end_mask_0 = const()[name = tensor("op_7371_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7371_cast_fp16 = slice_by_index(begin = var_7371_begin_0, end = var_7371_end_0, end_mask = var_7371_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7371_cast_fp16")]; + tensor var_7375_begin_0 = const()[name = tensor("op_7375_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_7375_end_0 = const()[name = tensor("op_7375_end_0"), val = tensor([2, 960, 1, 77])]; + tensor var_7375_end_mask_0 = const()[name = tensor("op_7375_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7375_cast_fp16 = slice_by_index(begin = var_7375_begin_0, end = var_7375_end_0, end_mask = var_7375_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7375_cast_fp16")]; + tensor var_7379_begin_0 = const()[name = tensor("op_7379_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_7379_end_0 = const()[name = tensor("op_7379_end_0"), val = tensor([2, 1024, 1, 77])]; + tensor var_7379_end_mask_0 = const()[name = tensor("op_7379_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7379_cast_fp16 = slice_by_index(begin = var_7379_begin_0, end = var_7379_end_0, end_mask = var_7379_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7379_cast_fp16")]; + tensor var_7383_begin_0 = const()[name = tensor("op_7383_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_7383_end_0 = const()[name = tensor("op_7383_end_0"), val = tensor([2, 1088, 1, 77])]; + tensor var_7383_end_mask_0 = const()[name = tensor("op_7383_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7383_cast_fp16 = slice_by_index(begin = var_7383_begin_0, end = var_7383_end_0, end_mask = var_7383_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7383_cast_fp16")]; + tensor var_7387_begin_0 = const()[name = tensor("op_7387_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_7387_end_0 = const()[name = tensor("op_7387_end_0"), val = tensor([2, 1152, 1, 77])]; + tensor var_7387_end_mask_0 = const()[name = tensor("op_7387_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7387_cast_fp16 = slice_by_index(begin = var_7387_begin_0, end = var_7387_end_0, end_mask = var_7387_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7387_cast_fp16")]; + tensor var_7391_begin_0 = const()[name = tensor("op_7391_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_7391_end_0 = const()[name = tensor("op_7391_end_0"), val = tensor([2, 1216, 1, 77])]; + tensor var_7391_end_mask_0 = const()[name = tensor("op_7391_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7391_cast_fp16 = slice_by_index(begin = var_7391_begin_0, end = var_7391_end_0, end_mask = var_7391_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7391_cast_fp16")]; + tensor var_7395_begin_0 = const()[name = tensor("op_7395_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_7395_end_0 = const()[name = tensor("op_7395_end_0"), val = tensor([2, 1280, 1, 77])]; + tensor var_7395_end_mask_0 = const()[name = tensor("op_7395_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7395_cast_fp16 = slice_by_index(begin = var_7395_begin_0, end = var_7395_end_0, end_mask = var_7395_end_mask_0, x = v_35_cast_fp16)[name = tensor("op_7395_cast_fp16")]; + tensor var_7399_equation_0 = const()[name = tensor("op_7399_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7399_cast_fp16 = einsum(equation = var_7399_equation_0, values = (var_7241_cast_fp16, var_7158_cast_fp16))[name = tensor("op_7399_cast_fp16")]; + tensor var_7400_to_fp16 = const()[name = tensor("op_7400_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_481_cast_fp16 = mul(x = var_7399_cast_fp16, y = var_7400_to_fp16)[name = tensor("aw_481_cast_fp16")]; + tensor var_7403_equation_0 = const()[name = tensor("op_7403_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7403_cast_fp16 = einsum(equation = var_7403_equation_0, values = (var_7245_cast_fp16, var_7162_cast_fp16))[name = tensor("op_7403_cast_fp16")]; + tensor var_7404_to_fp16 = const()[name = tensor("op_7404_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_483_cast_fp16 = mul(x = var_7403_cast_fp16, y = var_7404_to_fp16)[name = tensor("aw_483_cast_fp16")]; + tensor var_7407_equation_0 = const()[name = tensor("op_7407_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7407_cast_fp16 = einsum(equation = var_7407_equation_0, values = (var_7249_cast_fp16, var_7166_cast_fp16))[name = tensor("op_7407_cast_fp16")]; + tensor var_7408_to_fp16 = const()[name = tensor("op_7408_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_485_cast_fp16 = mul(x = var_7407_cast_fp16, y = var_7408_to_fp16)[name = tensor("aw_485_cast_fp16")]; + tensor var_7411_equation_0 = const()[name = tensor("op_7411_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7411_cast_fp16 = einsum(equation = var_7411_equation_0, values = (var_7253_cast_fp16, var_7170_cast_fp16))[name = tensor("op_7411_cast_fp16")]; + tensor var_7412_to_fp16 = const()[name = tensor("op_7412_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_487_cast_fp16 = mul(x = var_7411_cast_fp16, y = var_7412_to_fp16)[name = tensor("aw_487_cast_fp16")]; + tensor var_7415_equation_0 = const()[name = tensor("op_7415_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7415_cast_fp16 = einsum(equation = var_7415_equation_0, values = (var_7257_cast_fp16, var_7174_cast_fp16))[name = tensor("op_7415_cast_fp16")]; + tensor var_7416_to_fp16 = const()[name = tensor("op_7416_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_489_cast_fp16 = mul(x = var_7415_cast_fp16, y = var_7416_to_fp16)[name = tensor("aw_489_cast_fp16")]; + tensor var_7419_equation_0 = const()[name = tensor("op_7419_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7419_cast_fp16 = einsum(equation = var_7419_equation_0, values = (var_7261_cast_fp16, var_7178_cast_fp16))[name = tensor("op_7419_cast_fp16")]; + tensor var_7420_to_fp16 = const()[name = tensor("op_7420_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_491_cast_fp16 = mul(x = var_7419_cast_fp16, y = var_7420_to_fp16)[name = tensor("aw_491_cast_fp16")]; + tensor var_7423_equation_0 = const()[name = tensor("op_7423_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7423_cast_fp16 = einsum(equation = var_7423_equation_0, values = (var_7265_cast_fp16, var_7182_cast_fp16))[name = tensor("op_7423_cast_fp16")]; + tensor var_7424_to_fp16 = const()[name = tensor("op_7424_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_493_cast_fp16 = mul(x = var_7423_cast_fp16, y = var_7424_to_fp16)[name = tensor("aw_493_cast_fp16")]; + tensor var_7427_equation_0 = const()[name = tensor("op_7427_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7427_cast_fp16 = einsum(equation = var_7427_equation_0, values = (var_7269_cast_fp16, var_7186_cast_fp16))[name = tensor("op_7427_cast_fp16")]; + tensor var_7428_to_fp16 = const()[name = tensor("op_7428_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_495_cast_fp16 = mul(x = var_7427_cast_fp16, y = var_7428_to_fp16)[name = tensor("aw_495_cast_fp16")]; + tensor var_7431_equation_0 = const()[name = tensor("op_7431_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7431_cast_fp16 = einsum(equation = var_7431_equation_0, values = (var_7273_cast_fp16, var_7190_cast_fp16))[name = tensor("op_7431_cast_fp16")]; + tensor var_7432_to_fp16 = const()[name = tensor("op_7432_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_497_cast_fp16 = mul(x = var_7431_cast_fp16, y = var_7432_to_fp16)[name = tensor("aw_497_cast_fp16")]; + tensor var_7435_equation_0 = const()[name = tensor("op_7435_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7435_cast_fp16 = einsum(equation = var_7435_equation_0, values = (var_7277_cast_fp16, var_7194_cast_fp16))[name = tensor("op_7435_cast_fp16")]; + tensor var_7436_to_fp16 = const()[name = tensor("op_7436_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_499_cast_fp16 = mul(x = var_7435_cast_fp16, y = var_7436_to_fp16)[name = tensor("aw_499_cast_fp16")]; + tensor var_7439_equation_0 = const()[name = tensor("op_7439_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7439_cast_fp16 = einsum(equation = var_7439_equation_0, values = (var_7281_cast_fp16, var_7198_cast_fp16))[name = tensor("op_7439_cast_fp16")]; + tensor var_7440_to_fp16 = const()[name = tensor("op_7440_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_501_cast_fp16 = mul(x = var_7439_cast_fp16, y = var_7440_to_fp16)[name = tensor("aw_501_cast_fp16")]; + tensor var_7443_equation_0 = const()[name = tensor("op_7443_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7443_cast_fp16 = einsum(equation = var_7443_equation_0, values = (var_7285_cast_fp16, var_7202_cast_fp16))[name = tensor("op_7443_cast_fp16")]; + tensor var_7444_to_fp16 = const()[name = tensor("op_7444_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_503_cast_fp16 = mul(x = var_7443_cast_fp16, y = var_7444_to_fp16)[name = tensor("aw_503_cast_fp16")]; + tensor var_7447_equation_0 = const()[name = tensor("op_7447_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7447_cast_fp16 = einsum(equation = var_7447_equation_0, values = (var_7289_cast_fp16, var_7206_cast_fp16))[name = tensor("op_7447_cast_fp16")]; + tensor var_7448_to_fp16 = const()[name = tensor("op_7448_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_505_cast_fp16 = mul(x = var_7447_cast_fp16, y = var_7448_to_fp16)[name = tensor("aw_505_cast_fp16")]; + tensor var_7451_equation_0 = const()[name = tensor("op_7451_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7451_cast_fp16 = einsum(equation = var_7451_equation_0, values = (var_7293_cast_fp16, var_7210_cast_fp16))[name = tensor("op_7451_cast_fp16")]; + tensor var_7452_to_fp16 = const()[name = tensor("op_7452_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_507_cast_fp16 = mul(x = var_7451_cast_fp16, y = var_7452_to_fp16)[name = tensor("aw_507_cast_fp16")]; + tensor var_7455_equation_0 = const()[name = tensor("op_7455_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7455_cast_fp16 = einsum(equation = var_7455_equation_0, values = (var_7297_cast_fp16, var_7214_cast_fp16))[name = tensor("op_7455_cast_fp16")]; + tensor var_7456_to_fp16 = const()[name = tensor("op_7456_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_509_cast_fp16 = mul(x = var_7455_cast_fp16, y = var_7456_to_fp16)[name = tensor("aw_509_cast_fp16")]; + tensor var_7459_equation_0 = const()[name = tensor("op_7459_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7459_cast_fp16 = einsum(equation = var_7459_equation_0, values = (var_7301_cast_fp16, var_7218_cast_fp16))[name = tensor("op_7459_cast_fp16")]; + tensor var_7460_to_fp16 = const()[name = tensor("op_7460_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_511_cast_fp16 = mul(x = var_7459_cast_fp16, y = var_7460_to_fp16)[name = tensor("aw_511_cast_fp16")]; + tensor var_7463_equation_0 = const()[name = tensor("op_7463_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7463_cast_fp16 = einsum(equation = var_7463_equation_0, values = (var_7305_cast_fp16, var_7222_cast_fp16))[name = tensor("op_7463_cast_fp16")]; + tensor var_7464_to_fp16 = const()[name = tensor("op_7464_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_513_cast_fp16 = mul(x = var_7463_cast_fp16, y = var_7464_to_fp16)[name = tensor("aw_513_cast_fp16")]; + tensor var_7467_equation_0 = const()[name = tensor("op_7467_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7467_cast_fp16 = einsum(equation = var_7467_equation_0, values = (var_7309_cast_fp16, var_7226_cast_fp16))[name = tensor("op_7467_cast_fp16")]; + tensor var_7468_to_fp16 = const()[name = tensor("op_7468_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_515_cast_fp16 = mul(x = var_7467_cast_fp16, y = var_7468_to_fp16)[name = tensor("aw_515_cast_fp16")]; + tensor var_7471_equation_0 = const()[name = tensor("op_7471_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7471_cast_fp16 = einsum(equation = var_7471_equation_0, values = (var_7313_cast_fp16, var_7230_cast_fp16))[name = tensor("op_7471_cast_fp16")]; + tensor var_7472_to_fp16 = const()[name = tensor("op_7472_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_517_cast_fp16 = mul(x = var_7471_cast_fp16, y = var_7472_to_fp16)[name = tensor("aw_517_cast_fp16")]; + tensor var_7475_equation_0 = const()[name = tensor("op_7475_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7475_cast_fp16 = einsum(equation = var_7475_equation_0, values = (var_7317_cast_fp16, var_7234_cast_fp16))[name = tensor("op_7475_cast_fp16")]; + tensor var_7476_to_fp16 = const()[name = tensor("op_7476_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_519_cast_fp16 = mul(x = var_7475_cast_fp16, y = var_7476_to_fp16)[name = tensor("aw_519_cast_fp16")]; + tensor var_7478_cast_fp16 = softmax(axis = var_5599, x = aw_481_cast_fp16)[name = tensor("op_7478_cast_fp16")]; + tensor var_7479_cast_fp16 = softmax(axis = var_5599, x = aw_483_cast_fp16)[name = tensor("op_7479_cast_fp16")]; + tensor var_7480_cast_fp16 = softmax(axis = var_5599, x = aw_485_cast_fp16)[name = tensor("op_7480_cast_fp16")]; + tensor var_7481_cast_fp16 = softmax(axis = var_5599, x = aw_487_cast_fp16)[name = tensor("op_7481_cast_fp16")]; + tensor var_7482_cast_fp16 = softmax(axis = var_5599, x = aw_489_cast_fp16)[name = tensor("op_7482_cast_fp16")]; + tensor var_7483_cast_fp16 = softmax(axis = var_5599, x = aw_491_cast_fp16)[name = tensor("op_7483_cast_fp16")]; + tensor var_7484_cast_fp16 = softmax(axis = var_5599, x = aw_493_cast_fp16)[name = tensor("op_7484_cast_fp16")]; + tensor var_7485_cast_fp16 = softmax(axis = var_5599, x = aw_495_cast_fp16)[name = tensor("op_7485_cast_fp16")]; + tensor var_7486_cast_fp16 = softmax(axis = var_5599, x = aw_497_cast_fp16)[name = tensor("op_7486_cast_fp16")]; + tensor var_7487_cast_fp16 = softmax(axis = var_5599, x = aw_499_cast_fp16)[name = tensor("op_7487_cast_fp16")]; + tensor var_7488_cast_fp16 = softmax(axis = var_5599, x = aw_501_cast_fp16)[name = tensor("op_7488_cast_fp16")]; + tensor var_7489_cast_fp16 = softmax(axis = var_5599, x = aw_503_cast_fp16)[name = tensor("op_7489_cast_fp16")]; + tensor var_7490_cast_fp16 = softmax(axis = var_5599, x = aw_505_cast_fp16)[name = tensor("op_7490_cast_fp16")]; + tensor var_7491_cast_fp16 = softmax(axis = var_5599, x = aw_507_cast_fp16)[name = tensor("op_7491_cast_fp16")]; + tensor var_7492_cast_fp16 = softmax(axis = var_5599, x = aw_509_cast_fp16)[name = tensor("op_7492_cast_fp16")]; + tensor var_7493_cast_fp16 = softmax(axis = var_5599, x = aw_511_cast_fp16)[name = tensor("op_7493_cast_fp16")]; + tensor var_7494_cast_fp16 = softmax(axis = var_5599, x = aw_513_cast_fp16)[name = tensor("op_7494_cast_fp16")]; + tensor var_7495_cast_fp16 = softmax(axis = var_5599, x = aw_515_cast_fp16)[name = tensor("op_7495_cast_fp16")]; + tensor var_7496_cast_fp16 = softmax(axis = var_5599, x = aw_517_cast_fp16)[name = tensor("op_7496_cast_fp16")]; + tensor var_7497_cast_fp16 = softmax(axis = var_5599, x = aw_519_cast_fp16)[name = tensor("op_7497_cast_fp16")]; + tensor var_7499_equation_0 = const()[name = tensor("op_7499_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7499_cast_fp16 = einsum(equation = var_7499_equation_0, values = (var_7319_cast_fp16, var_7478_cast_fp16))[name = tensor("op_7499_cast_fp16")]; + tensor var_7501_equation_0 = const()[name = tensor("op_7501_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7501_cast_fp16 = einsum(equation = var_7501_equation_0, values = (var_7323_cast_fp16, var_7479_cast_fp16))[name = tensor("op_7501_cast_fp16")]; + tensor var_7503_equation_0 = const()[name = tensor("op_7503_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7503_cast_fp16 = einsum(equation = var_7503_equation_0, values = (var_7327_cast_fp16, var_7480_cast_fp16))[name = tensor("op_7503_cast_fp16")]; + tensor var_7505_equation_0 = const()[name = tensor("op_7505_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7505_cast_fp16 = einsum(equation = var_7505_equation_0, values = (var_7331_cast_fp16, var_7481_cast_fp16))[name = tensor("op_7505_cast_fp16")]; + tensor var_7507_equation_0 = const()[name = tensor("op_7507_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7507_cast_fp16 = einsum(equation = var_7507_equation_0, values = (var_7335_cast_fp16, var_7482_cast_fp16))[name = tensor("op_7507_cast_fp16")]; + tensor var_7509_equation_0 = const()[name = tensor("op_7509_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7509_cast_fp16 = einsum(equation = var_7509_equation_0, values = (var_7339_cast_fp16, var_7483_cast_fp16))[name = tensor("op_7509_cast_fp16")]; + tensor var_7511_equation_0 = const()[name = tensor("op_7511_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7511_cast_fp16 = einsum(equation = var_7511_equation_0, values = (var_7343_cast_fp16, var_7484_cast_fp16))[name = tensor("op_7511_cast_fp16")]; + tensor var_7513_equation_0 = const()[name = tensor("op_7513_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7513_cast_fp16 = einsum(equation = var_7513_equation_0, values = (var_7347_cast_fp16, var_7485_cast_fp16))[name = tensor("op_7513_cast_fp16")]; + tensor var_7515_equation_0 = const()[name = tensor("op_7515_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7515_cast_fp16 = einsum(equation = var_7515_equation_0, values = (var_7351_cast_fp16, var_7486_cast_fp16))[name = tensor("op_7515_cast_fp16")]; + tensor var_7517_equation_0 = const()[name = tensor("op_7517_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7517_cast_fp16 = einsum(equation = var_7517_equation_0, values = (var_7355_cast_fp16, var_7487_cast_fp16))[name = tensor("op_7517_cast_fp16")]; + tensor var_7519_equation_0 = const()[name = tensor("op_7519_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7519_cast_fp16 = einsum(equation = var_7519_equation_0, values = (var_7359_cast_fp16, var_7488_cast_fp16))[name = tensor("op_7519_cast_fp16")]; + tensor var_7521_equation_0 = const()[name = tensor("op_7521_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7521_cast_fp16 = einsum(equation = var_7521_equation_0, values = (var_7363_cast_fp16, var_7489_cast_fp16))[name = tensor("op_7521_cast_fp16")]; + tensor var_7523_equation_0 = const()[name = tensor("op_7523_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7523_cast_fp16 = einsum(equation = var_7523_equation_0, values = (var_7367_cast_fp16, var_7490_cast_fp16))[name = tensor("op_7523_cast_fp16")]; + tensor var_7525_equation_0 = const()[name = tensor("op_7525_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7525_cast_fp16 = einsum(equation = var_7525_equation_0, values = (var_7371_cast_fp16, var_7491_cast_fp16))[name = tensor("op_7525_cast_fp16")]; + tensor var_7527_equation_0 = const()[name = tensor("op_7527_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7527_cast_fp16 = einsum(equation = var_7527_equation_0, values = (var_7375_cast_fp16, var_7492_cast_fp16))[name = tensor("op_7527_cast_fp16")]; + tensor var_7529_equation_0 = const()[name = tensor("op_7529_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7529_cast_fp16 = einsum(equation = var_7529_equation_0, values = (var_7379_cast_fp16, var_7493_cast_fp16))[name = tensor("op_7529_cast_fp16")]; + tensor var_7531_equation_0 = const()[name = tensor("op_7531_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7531_cast_fp16 = einsum(equation = var_7531_equation_0, values = (var_7383_cast_fp16, var_7494_cast_fp16))[name = tensor("op_7531_cast_fp16")]; + tensor var_7533_equation_0 = const()[name = tensor("op_7533_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7533_cast_fp16 = einsum(equation = var_7533_equation_0, values = (var_7387_cast_fp16, var_7495_cast_fp16))[name = tensor("op_7533_cast_fp16")]; + tensor var_7535_equation_0 = const()[name = tensor("op_7535_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7535_cast_fp16 = einsum(equation = var_7535_equation_0, values = (var_7391_cast_fp16, var_7496_cast_fp16))[name = tensor("op_7535_cast_fp16")]; + tensor var_7537_equation_0 = const()[name = tensor("op_7537_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_7537_cast_fp16 = einsum(equation = var_7537_equation_0, values = (var_7395_cast_fp16, var_7497_cast_fp16))[name = tensor("op_7537_cast_fp16")]; + tensor input_329_interleave_0 = const()[name = tensor("input_329_interleave_0"), val = tensor(false)]; + tensor input_329_cast_fp16 = concat(axis = var_5599, interleave = input_329_interleave_0, values = (var_7499_cast_fp16, var_7501_cast_fp16, var_7503_cast_fp16, var_7505_cast_fp16, var_7507_cast_fp16, var_7509_cast_fp16, var_7511_cast_fp16, var_7513_cast_fp16, var_7515_cast_fp16, var_7517_cast_fp16, var_7519_cast_fp16, var_7521_cast_fp16, var_7523_cast_fp16, var_7525_cast_fp16, var_7527_cast_fp16, var_7529_cast_fp16, var_7531_cast_fp16, var_7533_cast_fp16, var_7535_cast_fp16, var_7537_cast_fp16))[name = tensor("input_329_cast_fp16")]; + tensor var_7543 = const()[name = tensor("op_7543"), val = tensor([1, 1])]; + tensor var_7545 = const()[name = tensor("op_7545"), val = tensor([1, 1])]; + tensor var_7547_pad_type_0 = const()[name = tensor("op_7547_pad_type_0"), val = tensor("custom")]; + tensor var_7547_pad_0 = const()[name = tensor("op_7547_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1320268608)))]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1323545472)))]; + tensor var_7547_cast_fp16 = conv(bias = up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_7545, groups = var_5599, pad = var_7547_pad_0, pad_type = var_7547_pad_type_0, strides = var_7543, weight = up_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_329_cast_fp16)[name = tensor("op_7547_cast_fp16")]; + tensor inputs_53_cast_fp16 = add(x = var_7547_cast_fp16, y = inputs_51_cast_fp16)[name = tensor("inputs_53_cast_fp16")]; + tensor var_7551 = const()[name = tensor("op_7551"), val = tensor([1])]; + tensor channels_mean_53_cast_fp16 = reduce_mean(axes = var_7551, keep_dims = var_5594, x = inputs_53_cast_fp16)[name = tensor("channels_mean_53_cast_fp16")]; + tensor zero_mean_53_cast_fp16 = sub(x = inputs_53_cast_fp16, y = channels_mean_53_cast_fp16)[name = tensor("zero_mean_53_cast_fp16")]; + tensor zero_mean_sq_53_cast_fp16 = mul(x = zero_mean_53_cast_fp16, y = zero_mean_53_cast_fp16)[name = tensor("zero_mean_sq_53_cast_fp16")]; + tensor var_7555 = const()[name = tensor("op_7555"), val = tensor([1])]; + tensor var_7556_cast_fp16 = reduce_mean(axes = var_7555, keep_dims = var_5594, x = zero_mean_sq_53_cast_fp16)[name = tensor("op_7556_cast_fp16")]; + tensor var_7557_to_fp16 = const()[name = tensor("op_7557_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_7558_cast_fp16 = add(x = var_7556_cast_fp16, y = var_7557_to_fp16)[name = tensor("op_7558_cast_fp16")]; + tensor denom_53_epsilon_0_to_fp16 = const()[name = tensor("denom_53_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_53_cast_fp16 = rsqrt(epsilon = denom_53_epsilon_0_to_fp16, x = var_7558_cast_fp16)[name = tensor("denom_53_cast_fp16")]; + tensor out_53_cast_fp16 = mul(x = zero_mean_53_cast_fp16, y = denom_53_cast_fp16)[name = tensor("out_53_cast_fp16")]; + tensor var_7562_to_fp16 = const()[name = tensor("op_7562_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1323548096)))]; + tensor var_7563_cast_fp16 = add(x = out_53_cast_fp16, y = var_7562_to_fp16)[name = tensor("op_7563_cast_fp16")]; + tensor var_7565_to_fp16 = const()[name = tensor("op_7565_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1323550720)))]; + tensor input_331_cast_fp16 = mul(x = var_7563_cast_fp16, y = var_7565_to_fp16)[name = tensor("input_331_cast_fp16")]; + tensor var_7573 = const()[name = tensor("op_7573"), val = tensor([1, 1])]; + tensor var_7575 = const()[name = tensor("op_7575"), val = tensor([1, 1])]; + tensor var_7577_pad_type_0 = const()[name = tensor("op_7577_pad_type_0"), val = tensor("custom")]; + tensor var_7577_pad_0 = const()[name = tensor("op_7577_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1323553344)))]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1349767808)))]; + tensor var_7577_cast_fp16 = conv(bias = up_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_7575, groups = var_5599, pad = var_7577_pad_0, pad_type = var_7577_pad_type_0, strides = var_7573, weight = up_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_331_cast_fp16)[name = tensor("op_7577_cast_fp16")]; + tensor var_7578_split_sizes_0 = const()[name = tensor("op_7578_split_sizes_0"), val = tensor([5120, 5120])]; + tensor var_7578_axis_0 = const()[name = tensor("op_7578_axis_0"), val = tensor(1)]; + tensor var_7578_cast_fp16_0, tensor var_7578_cast_fp16_1 = split(axis = var_7578_axis_0, split_sizes = var_7578_split_sizes_0, x = var_7577_cast_fp16)[name = tensor("op_7578_cast_fp16")]; + tensor var_7580_mode_0 = const()[name = tensor("op_7580_mode_0"), val = tensor("EXACT")]; + tensor var_7580_cast_fp16 = gelu(mode = var_7580_mode_0, x = var_7578_cast_fp16_1)[name = tensor("op_7580_cast_fp16")]; + tensor input_333_cast_fp16 = mul(x = var_7578_cast_fp16_0, y = var_7580_cast_fp16)[name = tensor("input_333_cast_fp16")]; + tensor var_7584 = const()[name = tensor("op_7584"), val = tensor([1, 1])]; + tensor var_7586 = const()[name = tensor("op_7586"), val = tensor([1, 1])]; + tensor var_7588_pad_type_0 = const()[name = tensor("op_7588_pad_type_0"), val = tensor("custom")]; + tensor var_7588_pad_0 = const()[name = tensor("op_7588_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1349788352)))]; + tensor up_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1362895616)))]; + tensor var_7588_cast_fp16 = conv(bias = up_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_7586, groups = var_5599, pad = var_7588_pad_0, pad_type = var_7588_pad_type_0, strides = var_7584, weight = up_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_333_cast_fp16)[name = tensor("op_7588_cast_fp16")]; + tensor hidden_states_193_cast_fp16 = add(x = var_7588_cast_fp16, y = inputs_53_cast_fp16)[name = tensor("hidden_states_193_cast_fp16")]; + tensor var_7590 = const()[name = tensor("op_7590"), val = tensor([2, 1280, 12, 12])]; + tensor input_335_cast_fp16 = reshape(shape = var_7590, x = hidden_states_193_cast_fp16)[name = tensor("input_335_cast_fp16")]; + tensor var_7594 = const()[name = tensor("op_7594"), val = tensor([1, 1])]; + tensor var_7596 = const()[name = tensor("op_7596"), val = tensor([1, 1])]; + tensor hidden_states_195_pad_type_0 = const()[name = tensor("hidden_states_195_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_195_pad_0 = const()[name = tensor("hidden_states_195_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_1_proj_out_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1362898240)))]; + tensor up_blocks_1_attentions_1_proj_out_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_1_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1366175104)))]; + tensor hidden_states_195_cast_fp16 = conv(bias = up_blocks_1_attentions_1_proj_out_bias_to_fp16, dilations = var_7596, groups = var_5599, pad = hidden_states_195_pad_0, pad_type = hidden_states_195_pad_type_0, strides = var_7594, weight = up_blocks_1_attentions_1_proj_out_weight_to_fp16, x = input_335_cast_fp16)[name = tensor("hidden_states_195_cast_fp16")]; + tensor hidden_states_197_cast_fp16 = add(x = hidden_states_195_cast_fp16, y = hidden_states_183_cast_fp16)[name = tensor("hidden_states_197_cast_fp16")]; + tensor input_337_interleave_0 = const()[name = tensor("input_337_interleave_0"), val = tensor(false)]; + tensor input_337_cast_fp16 = concat(axis = var_5599, interleave = input_337_interleave_0, values = (hidden_states_197_cast_fp16, input_117_cast_fp16))[name = tensor("input_337_cast_fp16")]; + tensor reshape_156_shape_0 = const()[name = tensor("reshape_156_shape_0"), val = tensor([2, 32, 60, 12, 12])]; + tensor reshape_156_cast_fp16 = reshape(shape = reshape_156_shape_0, x = input_337_cast_fp16)[name = tensor("reshape_156_cast_fp16")]; + tensor reduce_mean_117_axes_0 = const()[name = tensor("reduce_mean_117_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_117_keep_dims_0 = const()[name = tensor("reduce_mean_117_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_117_cast_fp16 = reduce_mean(axes = reduce_mean_117_axes_0, keep_dims = reduce_mean_117_keep_dims_0, x = reshape_156_cast_fp16)[name = tensor("reduce_mean_117_cast_fp16")]; + tensor sub_78_cast_fp16 = sub(x = reshape_156_cast_fp16, y = reduce_mean_117_cast_fp16)[name = tensor("sub_78_cast_fp16")]; + tensor square_39_cast_fp16 = square(x = sub_78_cast_fp16)[name = tensor("square_39_cast_fp16")]; + tensor reduce_mean_119_axes_0 = const()[name = tensor("reduce_mean_119_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_119_keep_dims_0 = const()[name = tensor("reduce_mean_119_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_119_cast_fp16 = reduce_mean(axes = reduce_mean_119_axes_0, keep_dims = reduce_mean_119_keep_dims_0, x = square_39_cast_fp16)[name = tensor("reduce_mean_119_cast_fp16")]; + tensor add_78_y_0_to_fp16 = const()[name = tensor("add_78_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_78_cast_fp16 = add(x = reduce_mean_119_cast_fp16, y = add_78_y_0_to_fp16)[name = tensor("add_78_cast_fp16")]; + tensor sqrt_39_cast_fp16 = sqrt(x = add_78_cast_fp16)[name = tensor("sqrt_39_cast_fp16")]; + tensor real_div_39_cast_fp16 = real_div(x = sub_78_cast_fp16, y = sqrt_39_cast_fp16)[name = tensor("real_div_39_cast_fp16")]; + tensor reshape_157_shape_0 = const()[name = tensor("reshape_157_shape_0"), val = tensor([2, 1920, 12, 12])]; + tensor reshape_157_cast_fp16 = reshape(shape = reshape_157_shape_0, x = real_div_39_cast_fp16)[name = tensor("reshape_157_cast_fp16")]; + tensor add_79_mean_0_to_fp16 = const()[name = tensor("add_79_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1366177728)))]; + tensor add_79_variance_0_to_fp16 = const()[name = tensor("add_79_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1366181632)))]; + tensor add_79_gamma_0_to_fp16 = const()[name = tensor("add_79_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1366185536)))]; + tensor add_79_beta_0_to_fp16 = const()[name = tensor("add_79_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1366189440)))]; + tensor add_79_epsilon_0_to_fp16 = const()[name = tensor("add_79_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_79_cast_fp16 = batch_norm(beta = add_79_beta_0_to_fp16, epsilon = add_79_epsilon_0_to_fp16, gamma = add_79_gamma_0_to_fp16, mean = add_79_mean_0_to_fp16, variance = add_79_variance_0_to_fp16, x = reshape_157_cast_fp16)[name = tensor("add_79_cast_fp16")]; + tensor input_341_cast_fp16 = silu(x = add_79_cast_fp16)[name = tensor("input_341_cast_fp16")]; + tensor var_7614 = const()[name = tensor("op_7614"), val = tensor([1, 1])]; + tensor var_7616 = const()[name = tensor("op_7616"), val = tensor([1, 1])]; + tensor hidden_states_199_pad_type_0 = const()[name = tensor("hidden_states_199_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_199_pad_0 = const()[name = tensor("hidden_states_199_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_1_resnets_2_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_2_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1366193344)))]; + tensor up_blocks_1_resnets_2_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_2_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1410430208)))]; + tensor hidden_states_199_cast_fp16 = conv(bias = up_blocks_1_resnets_2_conv1_bias_to_fp16, dilations = var_7616, groups = var_5599, pad = hidden_states_199_pad_0, pad_type = hidden_states_199_pad_type_0, strides = var_7614, weight = up_blocks_1_resnets_2_conv1_weight_to_fp16, x = input_341_cast_fp16)[name = tensor("hidden_states_199_cast_fp16")]; + tensor var_7622 = const()[name = tensor("op_7622"), val = tensor([1, 1])]; + tensor var_7624 = const()[name = tensor("op_7624"), val = tensor([1, 1])]; + tensor temb_31_pad_type_0 = const()[name = tensor("temb_31_pad_type_0"), val = tensor("custom")]; + tensor temb_31_pad_0 = const()[name = tensor("temb_31_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_resnets_2_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_2_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1410432832)))]; + tensor up_blocks_1_resnets_2_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_2_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1413709696)))]; + tensor temb_31_cast_fp16 = conv(bias = up_blocks_1_resnets_2_time_emb_proj_bias_to_fp16, dilations = var_7624, groups = var_5599, pad = temb_31_pad_0, pad_type = temb_31_pad_type_0, strides = var_7622, weight = up_blocks_1_resnets_2_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_31_cast_fp16")]; + tensor input_345_cast_fp16 = add(x = hidden_states_199_cast_fp16, y = temb_31_cast_fp16)[name = tensor("input_345_cast_fp16")]; + tensor reshape_160_shape_0 = const()[name = tensor("reshape_160_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_160_cast_fp16 = reshape(shape = reshape_160_shape_0, x = input_345_cast_fp16)[name = tensor("reshape_160_cast_fp16")]; + tensor reduce_mean_120_axes_0 = const()[name = tensor("reduce_mean_120_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_120_keep_dims_0 = const()[name = tensor("reduce_mean_120_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_120_cast_fp16 = reduce_mean(axes = reduce_mean_120_axes_0, keep_dims = reduce_mean_120_keep_dims_0, x = reshape_160_cast_fp16)[name = tensor("reduce_mean_120_cast_fp16")]; + tensor sub_80_cast_fp16 = sub(x = reshape_160_cast_fp16, y = reduce_mean_120_cast_fp16)[name = tensor("sub_80_cast_fp16")]; + tensor square_40_cast_fp16 = square(x = sub_80_cast_fp16)[name = tensor("square_40_cast_fp16")]; + tensor reduce_mean_122_axes_0 = const()[name = tensor("reduce_mean_122_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_122_keep_dims_0 = const()[name = tensor("reduce_mean_122_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_122_cast_fp16 = reduce_mean(axes = reduce_mean_122_axes_0, keep_dims = reduce_mean_122_keep_dims_0, x = square_40_cast_fp16)[name = tensor("reduce_mean_122_cast_fp16")]; + tensor add_80_y_0_to_fp16 = const()[name = tensor("add_80_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_80_cast_fp16 = add(x = reduce_mean_122_cast_fp16, y = add_80_y_0_to_fp16)[name = tensor("add_80_cast_fp16")]; + tensor sqrt_40_cast_fp16 = sqrt(x = add_80_cast_fp16)[name = tensor("sqrt_40_cast_fp16")]; + tensor real_div_40_cast_fp16 = real_div(x = sub_80_cast_fp16, y = sqrt_40_cast_fp16)[name = tensor("real_div_40_cast_fp16")]; + tensor reshape_161_shape_0 = const()[name = tensor("reshape_161_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_161_cast_fp16 = reshape(shape = reshape_161_shape_0, x = real_div_40_cast_fp16)[name = tensor("reshape_161_cast_fp16")]; + tensor add_81_gamma_0_to_fp16 = const()[name = tensor("add_81_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1413712320)))]; + tensor add_81_beta_0_to_fp16 = const()[name = tensor("add_81_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1413714944)))]; + tensor add_81_epsilon_0_to_fp16 = const()[name = tensor("add_81_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_81_cast_fp16 = batch_norm(beta = add_81_beta_0_to_fp16, epsilon = add_81_epsilon_0_to_fp16, gamma = add_81_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_161_cast_fp16)[name = tensor("add_81_cast_fp16")]; + tensor input_349_cast_fp16 = silu(x = add_81_cast_fp16)[name = tensor("input_349_cast_fp16")]; + tensor var_7634 = const()[name = tensor("op_7634"), val = tensor([1, 1])]; + tensor var_7636 = const()[name = tensor("op_7636"), val = tensor([1, 1])]; + tensor hidden_states_201_pad_type_0 = const()[name = tensor("hidden_states_201_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_201_pad_0 = const()[name = tensor("hidden_states_201_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_1_resnets_2_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_2_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1413717568)))]; + tensor up_blocks_1_resnets_2_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_2_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1443208832)))]; + tensor hidden_states_201_cast_fp16 = conv(bias = up_blocks_1_resnets_2_conv2_bias_to_fp16, dilations = var_7636, groups = var_5599, pad = hidden_states_201_pad_0, pad_type = hidden_states_201_pad_type_0, strides = var_7634, weight = up_blocks_1_resnets_2_conv2_weight_to_fp16, x = input_349_cast_fp16)[name = tensor("hidden_states_201_cast_fp16")]; + tensor var_7641 = const()[name = tensor("op_7641"), val = tensor([1, 1])]; + tensor var_7643 = const()[name = tensor("op_7643"), val = tensor([1, 1])]; + tensor x_15_pad_type_0 = const()[name = tensor("x_15_pad_type_0"), val = tensor("custom")]; + tensor x_15_pad_0 = const()[name = tensor("x_15_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_resnets_2_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_1_resnets_2_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1443211456)))]; + tensor up_blocks_1_resnets_2_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_1_resnets_2_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1448126720)))]; + tensor x_15_cast_fp16 = conv(bias = up_blocks_1_resnets_2_conv_shortcut_bias_to_fp16, dilations = var_7643, groups = var_5599, pad = x_15_pad_0, pad_type = x_15_pad_type_0, strides = var_7641, weight = up_blocks_1_resnets_2_conv_shortcut_weight_to_fp16, x = input_337_cast_fp16)[name = tensor("x_15_cast_fp16")]; + tensor hidden_states_203_cast_fp16 = add(x = x_15_cast_fp16, y = hidden_states_201_cast_fp16)[name = tensor("hidden_states_203_cast_fp16")]; + tensor reshape_164_shape_0 = const()[name = tensor("reshape_164_shape_0"), val = tensor([2, 32, 40, 12, 12])]; + tensor reshape_164_cast_fp16 = reshape(shape = reshape_164_shape_0, x = hidden_states_203_cast_fp16)[name = tensor("reshape_164_cast_fp16")]; + tensor reduce_mean_123_axes_0 = const()[name = tensor("reduce_mean_123_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_123_keep_dims_0 = const()[name = tensor("reduce_mean_123_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_123_cast_fp16 = reduce_mean(axes = reduce_mean_123_axes_0, keep_dims = reduce_mean_123_keep_dims_0, x = reshape_164_cast_fp16)[name = tensor("reduce_mean_123_cast_fp16")]; + tensor sub_82_cast_fp16 = sub(x = reshape_164_cast_fp16, y = reduce_mean_123_cast_fp16)[name = tensor("sub_82_cast_fp16")]; + tensor square_41_cast_fp16 = square(x = sub_82_cast_fp16)[name = tensor("square_41_cast_fp16")]; + tensor reduce_mean_125_axes_0 = const()[name = tensor("reduce_mean_125_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_125_keep_dims_0 = const()[name = tensor("reduce_mean_125_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_125_cast_fp16 = reduce_mean(axes = reduce_mean_125_axes_0, keep_dims = reduce_mean_125_keep_dims_0, x = square_41_cast_fp16)[name = tensor("reduce_mean_125_cast_fp16")]; + tensor add_82_y_0_to_fp16 = const()[name = tensor("add_82_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_82_cast_fp16 = add(x = reduce_mean_125_cast_fp16, y = add_82_y_0_to_fp16)[name = tensor("add_82_cast_fp16")]; + tensor sqrt_41_cast_fp16 = sqrt(x = add_82_cast_fp16)[name = tensor("sqrt_41_cast_fp16")]; + tensor real_div_41_cast_fp16 = real_div(x = sub_82_cast_fp16, y = sqrt_41_cast_fp16)[name = tensor("real_div_41_cast_fp16")]; + tensor reshape_165_shape_0 = const()[name = tensor("reshape_165_shape_0"), val = tensor([2, 1280, 12, 12])]; + tensor reshape_165_cast_fp16 = reshape(shape = reshape_165_shape_0, x = real_div_41_cast_fp16)[name = tensor("reshape_165_cast_fp16")]; + tensor add_83_gamma_0_to_fp16 = const()[name = tensor("add_83_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1448129344)))]; + tensor add_83_beta_0_to_fp16 = const()[name = tensor("add_83_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1448131968)))]; + tensor add_83_epsilon_0_to_fp16 = const()[name = tensor("add_83_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_83_cast_fp16 = batch_norm(beta = add_83_beta_0_to_fp16, epsilon = add_83_epsilon_0_to_fp16, gamma = add_83_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_165_cast_fp16)[name = tensor("add_83_cast_fp16")]; + tensor var_7663 = const()[name = tensor("op_7663"), val = tensor([1, 1])]; + tensor var_7665 = const()[name = tensor("op_7665"), val = tensor([1, 1])]; + tensor hidden_states_205_pad_type_0 = const()[name = tensor("hidden_states_205_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_205_pad_0 = const()[name = tensor("hidden_states_205_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_proj_in_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1448134592)))]; + tensor up_blocks_1_attentions_2_proj_in_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1451411456)))]; + tensor hidden_states_205_cast_fp16 = conv(bias = up_blocks_1_attentions_2_proj_in_bias_to_fp16, dilations = var_7665, groups = var_5599, pad = hidden_states_205_pad_0, pad_type = hidden_states_205_pad_type_0, strides = var_7663, weight = up_blocks_1_attentions_2_proj_in_weight_to_fp16, x = add_83_cast_fp16)[name = tensor("hidden_states_205_cast_fp16")]; + tensor var_7670 = const()[name = tensor("op_7670"), val = tensor([2, 1280, 1, 144])]; + tensor inputs_55_cast_fp16 = reshape(shape = var_7670, x = hidden_states_205_cast_fp16)[name = tensor("inputs_55_cast_fp16")]; + tensor var_7680 = const()[name = tensor("op_7680"), val = tensor([1])]; + tensor channels_mean_55_cast_fp16 = reduce_mean(axes = var_7680, keep_dims = var_5594, x = inputs_55_cast_fp16)[name = tensor("channels_mean_55_cast_fp16")]; + tensor zero_mean_55_cast_fp16 = sub(x = inputs_55_cast_fp16, y = channels_mean_55_cast_fp16)[name = tensor("zero_mean_55_cast_fp16")]; + tensor zero_mean_sq_55_cast_fp16 = mul(x = zero_mean_55_cast_fp16, y = zero_mean_55_cast_fp16)[name = tensor("zero_mean_sq_55_cast_fp16")]; + tensor var_7684 = const()[name = tensor("op_7684"), val = tensor([1])]; + tensor var_7685_cast_fp16 = reduce_mean(axes = var_7684, keep_dims = var_5594, x = zero_mean_sq_55_cast_fp16)[name = tensor("op_7685_cast_fp16")]; + tensor var_7686_to_fp16 = const()[name = tensor("op_7686_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_7687_cast_fp16 = add(x = var_7685_cast_fp16, y = var_7686_to_fp16)[name = tensor("op_7687_cast_fp16")]; + tensor denom_55_epsilon_0_to_fp16 = const()[name = tensor("denom_55_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_55_cast_fp16 = rsqrt(epsilon = denom_55_epsilon_0_to_fp16, x = var_7687_cast_fp16)[name = tensor("denom_55_cast_fp16")]; + tensor out_55_cast_fp16 = mul(x = zero_mean_55_cast_fp16, y = denom_55_cast_fp16)[name = tensor("out_55_cast_fp16")]; + tensor var_7691_to_fp16 = const()[name = tensor("op_7691_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1451414080)))]; + tensor var_7692_cast_fp16 = add(x = out_55_cast_fp16, y = var_7691_to_fp16)[name = tensor("op_7692_cast_fp16")]; + tensor var_7694_to_fp16 = const()[name = tensor("op_7694_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1451416704)))]; + tensor hidden_states_207_cast_fp16 = mul(x = var_7692_cast_fp16, y = var_7694_to_fp16)[name = tensor("hidden_states_207_cast_fp16")]; + tensor var_7701 = const()[name = tensor("op_7701"), val = tensor([1, 1])]; + tensor var_7703 = const()[name = tensor("op_7703"), val = tensor([1, 1])]; + tensor q_37_pad_type_0 = const()[name = tensor("q_37_pad_type_0"), val = tensor("custom")]; + tensor q_37_pad_0 = const()[name = tensor("q_37_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1451419328)))]; + tensor q_37_cast_fp16 = conv(dilations = var_7703, groups = var_5599, pad = q_37_pad_0, pad_type = q_37_pad_type_0, strides = var_7701, weight = up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_207_cast_fp16)[name = tensor("q_37_cast_fp16")]; + tensor var_7707 = const()[name = tensor("op_7707"), val = tensor([1, 1])]; + tensor var_7709 = const()[name = tensor("op_7709"), val = tensor([1, 1])]; + tensor k_73_pad_type_0 = const()[name = tensor("k_73_pad_type_0"), val = tensor("custom")]; + tensor k_73_pad_0 = const()[name = tensor("k_73_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1454696192)))]; + tensor k_73_cast_fp16 = conv(dilations = var_7709, groups = var_5599, pad = k_73_pad_0, pad_type = k_73_pad_type_0, strides = var_7707, weight = up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_207_cast_fp16)[name = tensor("k_73_cast_fp16")]; + tensor var_7713 = const()[name = tensor("op_7713"), val = tensor([1, 1])]; + tensor var_7715 = const()[name = tensor("op_7715"), val = tensor([1, 1])]; + tensor v_37_pad_type_0 = const()[name = tensor("v_37_pad_type_0"), val = tensor("custom")]; + tensor v_37_pad_0 = const()[name = tensor("v_37_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1457973056)))]; + tensor v_37_cast_fp16 = conv(dilations = var_7715, groups = var_5599, pad = v_37_pad_0, pad_type = v_37_pad_type_0, strides = var_7713, weight = up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_207_cast_fp16)[name = tensor("v_37_cast_fp16")]; + tensor var_7719_begin_0 = const()[name = tensor("op_7719_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_7719_end_0 = const()[name = tensor("op_7719_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_7719_end_mask_0 = const()[name = tensor("op_7719_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7719_cast_fp16 = slice_by_index(begin = var_7719_begin_0, end = var_7719_end_0, end_mask = var_7719_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7719_cast_fp16")]; + tensor var_7723_begin_0 = const()[name = tensor("op_7723_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_7723_end_0 = const()[name = tensor("op_7723_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_7723_end_mask_0 = const()[name = tensor("op_7723_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7723_cast_fp16 = slice_by_index(begin = var_7723_begin_0, end = var_7723_end_0, end_mask = var_7723_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7723_cast_fp16")]; + tensor var_7727_begin_0 = const()[name = tensor("op_7727_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_7727_end_0 = const()[name = tensor("op_7727_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_7727_end_mask_0 = const()[name = tensor("op_7727_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7727_cast_fp16 = slice_by_index(begin = var_7727_begin_0, end = var_7727_end_0, end_mask = var_7727_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7727_cast_fp16")]; + tensor var_7731_begin_0 = const()[name = tensor("op_7731_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_7731_end_0 = const()[name = tensor("op_7731_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_7731_end_mask_0 = const()[name = tensor("op_7731_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7731_cast_fp16 = slice_by_index(begin = var_7731_begin_0, end = var_7731_end_0, end_mask = var_7731_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7731_cast_fp16")]; + tensor var_7735_begin_0 = const()[name = tensor("op_7735_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_7735_end_0 = const()[name = tensor("op_7735_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_7735_end_mask_0 = const()[name = tensor("op_7735_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7735_cast_fp16 = slice_by_index(begin = var_7735_begin_0, end = var_7735_end_0, end_mask = var_7735_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7735_cast_fp16")]; + tensor var_7739_begin_0 = const()[name = tensor("op_7739_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_7739_end_0 = const()[name = tensor("op_7739_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_7739_end_mask_0 = const()[name = tensor("op_7739_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7739_cast_fp16 = slice_by_index(begin = var_7739_begin_0, end = var_7739_end_0, end_mask = var_7739_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7739_cast_fp16")]; + tensor var_7743_begin_0 = const()[name = tensor("op_7743_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_7743_end_0 = const()[name = tensor("op_7743_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_7743_end_mask_0 = const()[name = tensor("op_7743_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7743_cast_fp16 = slice_by_index(begin = var_7743_begin_0, end = var_7743_end_0, end_mask = var_7743_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7743_cast_fp16")]; + tensor var_7747_begin_0 = const()[name = tensor("op_7747_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_7747_end_0 = const()[name = tensor("op_7747_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_7747_end_mask_0 = const()[name = tensor("op_7747_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7747_cast_fp16 = slice_by_index(begin = var_7747_begin_0, end = var_7747_end_0, end_mask = var_7747_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7747_cast_fp16")]; + tensor var_7751_begin_0 = const()[name = tensor("op_7751_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_7751_end_0 = const()[name = tensor("op_7751_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_7751_end_mask_0 = const()[name = tensor("op_7751_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7751_cast_fp16 = slice_by_index(begin = var_7751_begin_0, end = var_7751_end_0, end_mask = var_7751_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7751_cast_fp16")]; + tensor var_7755_begin_0 = const()[name = tensor("op_7755_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_7755_end_0 = const()[name = tensor("op_7755_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_7755_end_mask_0 = const()[name = tensor("op_7755_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7755_cast_fp16 = slice_by_index(begin = var_7755_begin_0, end = var_7755_end_0, end_mask = var_7755_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7755_cast_fp16")]; + tensor var_7759_begin_0 = const()[name = tensor("op_7759_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_7759_end_0 = const()[name = tensor("op_7759_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_7759_end_mask_0 = const()[name = tensor("op_7759_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7759_cast_fp16 = slice_by_index(begin = var_7759_begin_0, end = var_7759_end_0, end_mask = var_7759_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7759_cast_fp16")]; + tensor var_7763_begin_0 = const()[name = tensor("op_7763_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_7763_end_0 = const()[name = tensor("op_7763_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_7763_end_mask_0 = const()[name = tensor("op_7763_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7763_cast_fp16 = slice_by_index(begin = var_7763_begin_0, end = var_7763_end_0, end_mask = var_7763_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7763_cast_fp16")]; + tensor var_7767_begin_0 = const()[name = tensor("op_7767_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_7767_end_0 = const()[name = tensor("op_7767_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_7767_end_mask_0 = const()[name = tensor("op_7767_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7767_cast_fp16 = slice_by_index(begin = var_7767_begin_0, end = var_7767_end_0, end_mask = var_7767_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7767_cast_fp16")]; + tensor var_7771_begin_0 = const()[name = tensor("op_7771_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_7771_end_0 = const()[name = tensor("op_7771_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_7771_end_mask_0 = const()[name = tensor("op_7771_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7771_cast_fp16 = slice_by_index(begin = var_7771_begin_0, end = var_7771_end_0, end_mask = var_7771_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7771_cast_fp16")]; + tensor var_7775_begin_0 = const()[name = tensor("op_7775_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_7775_end_0 = const()[name = tensor("op_7775_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_7775_end_mask_0 = const()[name = tensor("op_7775_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7775_cast_fp16 = slice_by_index(begin = var_7775_begin_0, end = var_7775_end_0, end_mask = var_7775_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7775_cast_fp16")]; + tensor var_7779_begin_0 = const()[name = tensor("op_7779_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_7779_end_0 = const()[name = tensor("op_7779_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_7779_end_mask_0 = const()[name = tensor("op_7779_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7779_cast_fp16 = slice_by_index(begin = var_7779_begin_0, end = var_7779_end_0, end_mask = var_7779_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7779_cast_fp16")]; + tensor var_7783_begin_0 = const()[name = tensor("op_7783_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_7783_end_0 = const()[name = tensor("op_7783_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_7783_end_mask_0 = const()[name = tensor("op_7783_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7783_cast_fp16 = slice_by_index(begin = var_7783_begin_0, end = var_7783_end_0, end_mask = var_7783_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7783_cast_fp16")]; + tensor var_7787_begin_0 = const()[name = tensor("op_7787_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_7787_end_0 = const()[name = tensor("op_7787_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_7787_end_mask_0 = const()[name = tensor("op_7787_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7787_cast_fp16 = slice_by_index(begin = var_7787_begin_0, end = var_7787_end_0, end_mask = var_7787_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7787_cast_fp16")]; + tensor var_7791_begin_0 = const()[name = tensor("op_7791_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_7791_end_0 = const()[name = tensor("op_7791_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_7791_end_mask_0 = const()[name = tensor("op_7791_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7791_cast_fp16 = slice_by_index(begin = var_7791_begin_0, end = var_7791_end_0, end_mask = var_7791_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7791_cast_fp16")]; + tensor var_7795_begin_0 = const()[name = tensor("op_7795_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_7795_end_0 = const()[name = tensor("op_7795_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_7795_end_mask_0 = const()[name = tensor("op_7795_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7795_cast_fp16 = slice_by_index(begin = var_7795_begin_0, end = var_7795_end_0, end_mask = var_7795_end_mask_0, x = q_37_cast_fp16)[name = tensor("op_7795_cast_fp16")]; + tensor k_75_perm_0 = const()[name = tensor("k_75_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_7802_begin_0 = const()[name = tensor("op_7802_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_7802_end_0 = const()[name = tensor("op_7802_end_0"), val = tensor([2, 144, 1, 64])]; + tensor var_7802_end_mask_0 = const()[name = tensor("op_7802_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_13 = transpose(perm = k_75_perm_0, x = k_73_cast_fp16)[name = tensor("transpose_13")]; + tensor var_7802_cast_fp16 = slice_by_index(begin = var_7802_begin_0, end = var_7802_end_0, end_mask = var_7802_end_mask_0, x = transpose_13)[name = tensor("op_7802_cast_fp16")]; + tensor var_7806_begin_0 = const()[name = tensor("op_7806_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_7806_end_0 = const()[name = tensor("op_7806_end_0"), val = tensor([2, 144, 1, 128])]; + tensor var_7806_end_mask_0 = const()[name = tensor("op_7806_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7806_cast_fp16 = slice_by_index(begin = var_7806_begin_0, end = var_7806_end_0, end_mask = var_7806_end_mask_0, x = transpose_13)[name = tensor("op_7806_cast_fp16")]; + tensor var_7810_begin_0 = const()[name = tensor("op_7810_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_7810_end_0 = const()[name = tensor("op_7810_end_0"), val = tensor([2, 144, 1, 192])]; + tensor var_7810_end_mask_0 = const()[name = tensor("op_7810_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7810_cast_fp16 = slice_by_index(begin = var_7810_begin_0, end = var_7810_end_0, end_mask = var_7810_end_mask_0, x = transpose_13)[name = tensor("op_7810_cast_fp16")]; + tensor var_7814_begin_0 = const()[name = tensor("op_7814_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_7814_end_0 = const()[name = tensor("op_7814_end_0"), val = tensor([2, 144, 1, 256])]; + tensor var_7814_end_mask_0 = const()[name = tensor("op_7814_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7814_cast_fp16 = slice_by_index(begin = var_7814_begin_0, end = var_7814_end_0, end_mask = var_7814_end_mask_0, x = transpose_13)[name = tensor("op_7814_cast_fp16")]; + tensor var_7818_begin_0 = const()[name = tensor("op_7818_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_7818_end_0 = const()[name = tensor("op_7818_end_0"), val = tensor([2, 144, 1, 320])]; + tensor var_7818_end_mask_0 = const()[name = tensor("op_7818_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7818_cast_fp16 = slice_by_index(begin = var_7818_begin_0, end = var_7818_end_0, end_mask = var_7818_end_mask_0, x = transpose_13)[name = tensor("op_7818_cast_fp16")]; + tensor var_7822_begin_0 = const()[name = tensor("op_7822_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_7822_end_0 = const()[name = tensor("op_7822_end_0"), val = tensor([2, 144, 1, 384])]; + tensor var_7822_end_mask_0 = const()[name = tensor("op_7822_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7822_cast_fp16 = slice_by_index(begin = var_7822_begin_0, end = var_7822_end_0, end_mask = var_7822_end_mask_0, x = transpose_13)[name = tensor("op_7822_cast_fp16")]; + tensor var_7826_begin_0 = const()[name = tensor("op_7826_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_7826_end_0 = const()[name = tensor("op_7826_end_0"), val = tensor([2, 144, 1, 448])]; + tensor var_7826_end_mask_0 = const()[name = tensor("op_7826_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7826_cast_fp16 = slice_by_index(begin = var_7826_begin_0, end = var_7826_end_0, end_mask = var_7826_end_mask_0, x = transpose_13)[name = tensor("op_7826_cast_fp16")]; + tensor var_7830_begin_0 = const()[name = tensor("op_7830_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_7830_end_0 = const()[name = tensor("op_7830_end_0"), val = tensor([2, 144, 1, 512])]; + tensor var_7830_end_mask_0 = const()[name = tensor("op_7830_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7830_cast_fp16 = slice_by_index(begin = var_7830_begin_0, end = var_7830_end_0, end_mask = var_7830_end_mask_0, x = transpose_13)[name = tensor("op_7830_cast_fp16")]; + tensor var_7834_begin_0 = const()[name = tensor("op_7834_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_7834_end_0 = const()[name = tensor("op_7834_end_0"), val = tensor([2, 144, 1, 576])]; + tensor var_7834_end_mask_0 = const()[name = tensor("op_7834_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7834_cast_fp16 = slice_by_index(begin = var_7834_begin_0, end = var_7834_end_0, end_mask = var_7834_end_mask_0, x = transpose_13)[name = tensor("op_7834_cast_fp16")]; + tensor var_7838_begin_0 = const()[name = tensor("op_7838_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_7838_end_0 = const()[name = tensor("op_7838_end_0"), val = tensor([2, 144, 1, 640])]; + tensor var_7838_end_mask_0 = const()[name = tensor("op_7838_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7838_cast_fp16 = slice_by_index(begin = var_7838_begin_0, end = var_7838_end_0, end_mask = var_7838_end_mask_0, x = transpose_13)[name = tensor("op_7838_cast_fp16")]; + tensor var_7842_begin_0 = const()[name = tensor("op_7842_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_7842_end_0 = const()[name = tensor("op_7842_end_0"), val = tensor([2, 144, 1, 704])]; + tensor var_7842_end_mask_0 = const()[name = tensor("op_7842_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7842_cast_fp16 = slice_by_index(begin = var_7842_begin_0, end = var_7842_end_0, end_mask = var_7842_end_mask_0, x = transpose_13)[name = tensor("op_7842_cast_fp16")]; + tensor var_7846_begin_0 = const()[name = tensor("op_7846_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_7846_end_0 = const()[name = tensor("op_7846_end_0"), val = tensor([2, 144, 1, 768])]; + tensor var_7846_end_mask_0 = const()[name = tensor("op_7846_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7846_cast_fp16 = slice_by_index(begin = var_7846_begin_0, end = var_7846_end_0, end_mask = var_7846_end_mask_0, x = transpose_13)[name = tensor("op_7846_cast_fp16")]; + tensor var_7850_begin_0 = const()[name = tensor("op_7850_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_7850_end_0 = const()[name = tensor("op_7850_end_0"), val = tensor([2, 144, 1, 832])]; + tensor var_7850_end_mask_0 = const()[name = tensor("op_7850_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7850_cast_fp16 = slice_by_index(begin = var_7850_begin_0, end = var_7850_end_0, end_mask = var_7850_end_mask_0, x = transpose_13)[name = tensor("op_7850_cast_fp16")]; + tensor var_7854_begin_0 = const()[name = tensor("op_7854_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_7854_end_0 = const()[name = tensor("op_7854_end_0"), val = tensor([2, 144, 1, 896])]; + tensor var_7854_end_mask_0 = const()[name = tensor("op_7854_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7854_cast_fp16 = slice_by_index(begin = var_7854_begin_0, end = var_7854_end_0, end_mask = var_7854_end_mask_0, x = transpose_13)[name = tensor("op_7854_cast_fp16")]; + tensor var_7858_begin_0 = const()[name = tensor("op_7858_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_7858_end_0 = const()[name = tensor("op_7858_end_0"), val = tensor([2, 144, 1, 960])]; + tensor var_7858_end_mask_0 = const()[name = tensor("op_7858_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7858_cast_fp16 = slice_by_index(begin = var_7858_begin_0, end = var_7858_end_0, end_mask = var_7858_end_mask_0, x = transpose_13)[name = tensor("op_7858_cast_fp16")]; + tensor var_7862_begin_0 = const()[name = tensor("op_7862_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_7862_end_0 = const()[name = tensor("op_7862_end_0"), val = tensor([2, 144, 1, 1024])]; + tensor var_7862_end_mask_0 = const()[name = tensor("op_7862_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7862_cast_fp16 = slice_by_index(begin = var_7862_begin_0, end = var_7862_end_0, end_mask = var_7862_end_mask_0, x = transpose_13)[name = tensor("op_7862_cast_fp16")]; + tensor var_7866_begin_0 = const()[name = tensor("op_7866_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_7866_end_0 = const()[name = tensor("op_7866_end_0"), val = tensor([2, 144, 1, 1088])]; + tensor var_7866_end_mask_0 = const()[name = tensor("op_7866_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7866_cast_fp16 = slice_by_index(begin = var_7866_begin_0, end = var_7866_end_0, end_mask = var_7866_end_mask_0, x = transpose_13)[name = tensor("op_7866_cast_fp16")]; + tensor var_7870_begin_0 = const()[name = tensor("op_7870_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_7870_end_0 = const()[name = tensor("op_7870_end_0"), val = tensor([2, 144, 1, 1152])]; + tensor var_7870_end_mask_0 = const()[name = tensor("op_7870_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7870_cast_fp16 = slice_by_index(begin = var_7870_begin_0, end = var_7870_end_0, end_mask = var_7870_end_mask_0, x = transpose_13)[name = tensor("op_7870_cast_fp16")]; + tensor var_7874_begin_0 = const()[name = tensor("op_7874_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_7874_end_0 = const()[name = tensor("op_7874_end_0"), val = tensor([2, 144, 1, 1216])]; + tensor var_7874_end_mask_0 = const()[name = tensor("op_7874_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7874_cast_fp16 = slice_by_index(begin = var_7874_begin_0, end = var_7874_end_0, end_mask = var_7874_end_mask_0, x = transpose_13)[name = tensor("op_7874_cast_fp16")]; + tensor var_7878_begin_0 = const()[name = tensor("op_7878_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_7878_end_0 = const()[name = tensor("op_7878_end_0"), val = tensor([2, 144, 1, 1280])]; + tensor var_7878_end_mask_0 = const()[name = tensor("op_7878_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_7878_cast_fp16 = slice_by_index(begin = var_7878_begin_0, end = var_7878_end_0, end_mask = var_7878_end_mask_0, x = transpose_13)[name = tensor("op_7878_cast_fp16")]; + tensor var_7880_begin_0 = const()[name = tensor("op_7880_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_7880_end_0 = const()[name = tensor("op_7880_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_7880_end_mask_0 = const()[name = tensor("op_7880_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7880_cast_fp16 = slice_by_index(begin = var_7880_begin_0, end = var_7880_end_0, end_mask = var_7880_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7880_cast_fp16")]; + tensor var_7884_begin_0 = const()[name = tensor("op_7884_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_7884_end_0 = const()[name = tensor("op_7884_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_7884_end_mask_0 = const()[name = tensor("op_7884_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7884_cast_fp16 = slice_by_index(begin = var_7884_begin_0, end = var_7884_end_0, end_mask = var_7884_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7884_cast_fp16")]; + tensor var_7888_begin_0 = const()[name = tensor("op_7888_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_7888_end_0 = const()[name = tensor("op_7888_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_7888_end_mask_0 = const()[name = tensor("op_7888_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7888_cast_fp16 = slice_by_index(begin = var_7888_begin_0, end = var_7888_end_0, end_mask = var_7888_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7888_cast_fp16")]; + tensor var_7892_begin_0 = const()[name = tensor("op_7892_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_7892_end_0 = const()[name = tensor("op_7892_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_7892_end_mask_0 = const()[name = tensor("op_7892_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7892_cast_fp16 = slice_by_index(begin = var_7892_begin_0, end = var_7892_end_0, end_mask = var_7892_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7892_cast_fp16")]; + tensor var_7896_begin_0 = const()[name = tensor("op_7896_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_7896_end_0 = const()[name = tensor("op_7896_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_7896_end_mask_0 = const()[name = tensor("op_7896_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7896_cast_fp16 = slice_by_index(begin = var_7896_begin_0, end = var_7896_end_0, end_mask = var_7896_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7896_cast_fp16")]; + tensor var_7900_begin_0 = const()[name = tensor("op_7900_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_7900_end_0 = const()[name = tensor("op_7900_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_7900_end_mask_0 = const()[name = tensor("op_7900_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7900_cast_fp16 = slice_by_index(begin = var_7900_begin_0, end = var_7900_end_0, end_mask = var_7900_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7900_cast_fp16")]; + tensor var_7904_begin_0 = const()[name = tensor("op_7904_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_7904_end_0 = const()[name = tensor("op_7904_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_7904_end_mask_0 = const()[name = tensor("op_7904_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7904_cast_fp16 = slice_by_index(begin = var_7904_begin_0, end = var_7904_end_0, end_mask = var_7904_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7904_cast_fp16")]; + tensor var_7908_begin_0 = const()[name = tensor("op_7908_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_7908_end_0 = const()[name = tensor("op_7908_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_7908_end_mask_0 = const()[name = tensor("op_7908_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7908_cast_fp16 = slice_by_index(begin = var_7908_begin_0, end = var_7908_end_0, end_mask = var_7908_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7908_cast_fp16")]; + tensor var_7912_begin_0 = const()[name = tensor("op_7912_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_7912_end_0 = const()[name = tensor("op_7912_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_7912_end_mask_0 = const()[name = tensor("op_7912_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7912_cast_fp16 = slice_by_index(begin = var_7912_begin_0, end = var_7912_end_0, end_mask = var_7912_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7912_cast_fp16")]; + tensor var_7916_begin_0 = const()[name = tensor("op_7916_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_7916_end_0 = const()[name = tensor("op_7916_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_7916_end_mask_0 = const()[name = tensor("op_7916_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7916_cast_fp16 = slice_by_index(begin = var_7916_begin_0, end = var_7916_end_0, end_mask = var_7916_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7916_cast_fp16")]; + tensor var_7920_begin_0 = const()[name = tensor("op_7920_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_7920_end_0 = const()[name = tensor("op_7920_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_7920_end_mask_0 = const()[name = tensor("op_7920_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7920_cast_fp16 = slice_by_index(begin = var_7920_begin_0, end = var_7920_end_0, end_mask = var_7920_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7920_cast_fp16")]; + tensor var_7924_begin_0 = const()[name = tensor("op_7924_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_7924_end_0 = const()[name = tensor("op_7924_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_7924_end_mask_0 = const()[name = tensor("op_7924_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7924_cast_fp16 = slice_by_index(begin = var_7924_begin_0, end = var_7924_end_0, end_mask = var_7924_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7924_cast_fp16")]; + tensor var_7928_begin_0 = const()[name = tensor("op_7928_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_7928_end_0 = const()[name = tensor("op_7928_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_7928_end_mask_0 = const()[name = tensor("op_7928_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7928_cast_fp16 = slice_by_index(begin = var_7928_begin_0, end = var_7928_end_0, end_mask = var_7928_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7928_cast_fp16")]; + tensor var_7932_begin_0 = const()[name = tensor("op_7932_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_7932_end_0 = const()[name = tensor("op_7932_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_7932_end_mask_0 = const()[name = tensor("op_7932_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7932_cast_fp16 = slice_by_index(begin = var_7932_begin_0, end = var_7932_end_0, end_mask = var_7932_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7932_cast_fp16")]; + tensor var_7936_begin_0 = const()[name = tensor("op_7936_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_7936_end_0 = const()[name = tensor("op_7936_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_7936_end_mask_0 = const()[name = tensor("op_7936_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7936_cast_fp16 = slice_by_index(begin = var_7936_begin_0, end = var_7936_end_0, end_mask = var_7936_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7936_cast_fp16")]; + tensor var_7940_begin_0 = const()[name = tensor("op_7940_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_7940_end_0 = const()[name = tensor("op_7940_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_7940_end_mask_0 = const()[name = tensor("op_7940_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7940_cast_fp16 = slice_by_index(begin = var_7940_begin_0, end = var_7940_end_0, end_mask = var_7940_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7940_cast_fp16")]; + tensor var_7944_begin_0 = const()[name = tensor("op_7944_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_7944_end_0 = const()[name = tensor("op_7944_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_7944_end_mask_0 = const()[name = tensor("op_7944_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7944_cast_fp16 = slice_by_index(begin = var_7944_begin_0, end = var_7944_end_0, end_mask = var_7944_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7944_cast_fp16")]; + tensor var_7948_begin_0 = const()[name = tensor("op_7948_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_7948_end_0 = const()[name = tensor("op_7948_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_7948_end_mask_0 = const()[name = tensor("op_7948_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7948_cast_fp16 = slice_by_index(begin = var_7948_begin_0, end = var_7948_end_0, end_mask = var_7948_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7948_cast_fp16")]; + tensor var_7952_begin_0 = const()[name = tensor("op_7952_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_7952_end_0 = const()[name = tensor("op_7952_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_7952_end_mask_0 = const()[name = tensor("op_7952_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7952_cast_fp16 = slice_by_index(begin = var_7952_begin_0, end = var_7952_end_0, end_mask = var_7952_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7952_cast_fp16")]; + tensor var_7956_begin_0 = const()[name = tensor("op_7956_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_7956_end_0 = const()[name = tensor("op_7956_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_7956_end_mask_0 = const()[name = tensor("op_7956_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_7956_cast_fp16 = slice_by_index(begin = var_7956_begin_0, end = var_7956_end_0, end_mask = var_7956_end_mask_0, x = v_37_cast_fp16)[name = tensor("op_7956_cast_fp16")]; + tensor var_7960_equation_0 = const()[name = tensor("op_7960_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7960_cast_fp16 = einsum(equation = var_7960_equation_0, values = (var_7802_cast_fp16, var_7719_cast_fp16))[name = tensor("op_7960_cast_fp16")]; + tensor var_7961_to_fp16 = const()[name = tensor("op_7961_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_521_cast_fp16 = mul(x = var_7960_cast_fp16, y = var_7961_to_fp16)[name = tensor("aw_521_cast_fp16")]; + tensor var_7964_equation_0 = const()[name = tensor("op_7964_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7964_cast_fp16 = einsum(equation = var_7964_equation_0, values = (var_7806_cast_fp16, var_7723_cast_fp16))[name = tensor("op_7964_cast_fp16")]; + tensor var_7965_to_fp16 = const()[name = tensor("op_7965_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_523_cast_fp16 = mul(x = var_7964_cast_fp16, y = var_7965_to_fp16)[name = tensor("aw_523_cast_fp16")]; + tensor var_7968_equation_0 = const()[name = tensor("op_7968_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7968_cast_fp16 = einsum(equation = var_7968_equation_0, values = (var_7810_cast_fp16, var_7727_cast_fp16))[name = tensor("op_7968_cast_fp16")]; + tensor var_7969_to_fp16 = const()[name = tensor("op_7969_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_525_cast_fp16 = mul(x = var_7968_cast_fp16, y = var_7969_to_fp16)[name = tensor("aw_525_cast_fp16")]; + tensor var_7972_equation_0 = const()[name = tensor("op_7972_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7972_cast_fp16 = einsum(equation = var_7972_equation_0, values = (var_7814_cast_fp16, var_7731_cast_fp16))[name = tensor("op_7972_cast_fp16")]; + tensor var_7973_to_fp16 = const()[name = tensor("op_7973_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_527_cast_fp16 = mul(x = var_7972_cast_fp16, y = var_7973_to_fp16)[name = tensor("aw_527_cast_fp16")]; + tensor var_7976_equation_0 = const()[name = tensor("op_7976_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7976_cast_fp16 = einsum(equation = var_7976_equation_0, values = (var_7818_cast_fp16, var_7735_cast_fp16))[name = tensor("op_7976_cast_fp16")]; + tensor var_7977_to_fp16 = const()[name = tensor("op_7977_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_529_cast_fp16 = mul(x = var_7976_cast_fp16, y = var_7977_to_fp16)[name = tensor("aw_529_cast_fp16")]; + tensor var_7980_equation_0 = const()[name = tensor("op_7980_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7980_cast_fp16 = einsum(equation = var_7980_equation_0, values = (var_7822_cast_fp16, var_7739_cast_fp16))[name = tensor("op_7980_cast_fp16")]; + tensor var_7981_to_fp16 = const()[name = tensor("op_7981_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_531_cast_fp16 = mul(x = var_7980_cast_fp16, y = var_7981_to_fp16)[name = tensor("aw_531_cast_fp16")]; + tensor var_7984_equation_0 = const()[name = tensor("op_7984_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7984_cast_fp16 = einsum(equation = var_7984_equation_0, values = (var_7826_cast_fp16, var_7743_cast_fp16))[name = tensor("op_7984_cast_fp16")]; + tensor var_7985_to_fp16 = const()[name = tensor("op_7985_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_533_cast_fp16 = mul(x = var_7984_cast_fp16, y = var_7985_to_fp16)[name = tensor("aw_533_cast_fp16")]; + tensor var_7988_equation_0 = const()[name = tensor("op_7988_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7988_cast_fp16 = einsum(equation = var_7988_equation_0, values = (var_7830_cast_fp16, var_7747_cast_fp16))[name = tensor("op_7988_cast_fp16")]; + tensor var_7989_to_fp16 = const()[name = tensor("op_7989_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_535_cast_fp16 = mul(x = var_7988_cast_fp16, y = var_7989_to_fp16)[name = tensor("aw_535_cast_fp16")]; + tensor var_7992_equation_0 = const()[name = tensor("op_7992_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7992_cast_fp16 = einsum(equation = var_7992_equation_0, values = (var_7834_cast_fp16, var_7751_cast_fp16))[name = tensor("op_7992_cast_fp16")]; + tensor var_7993_to_fp16 = const()[name = tensor("op_7993_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_537_cast_fp16 = mul(x = var_7992_cast_fp16, y = var_7993_to_fp16)[name = tensor("aw_537_cast_fp16")]; + tensor var_7996_equation_0 = const()[name = tensor("op_7996_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_7996_cast_fp16 = einsum(equation = var_7996_equation_0, values = (var_7838_cast_fp16, var_7755_cast_fp16))[name = tensor("op_7996_cast_fp16")]; + tensor var_7997_to_fp16 = const()[name = tensor("op_7997_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_539_cast_fp16 = mul(x = var_7996_cast_fp16, y = var_7997_to_fp16)[name = tensor("aw_539_cast_fp16")]; + tensor var_8000_equation_0 = const()[name = tensor("op_8000_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8000_cast_fp16 = einsum(equation = var_8000_equation_0, values = (var_7842_cast_fp16, var_7759_cast_fp16))[name = tensor("op_8000_cast_fp16")]; + tensor var_8001_to_fp16 = const()[name = tensor("op_8001_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_541_cast_fp16 = mul(x = var_8000_cast_fp16, y = var_8001_to_fp16)[name = tensor("aw_541_cast_fp16")]; + tensor var_8004_equation_0 = const()[name = tensor("op_8004_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8004_cast_fp16 = einsum(equation = var_8004_equation_0, values = (var_7846_cast_fp16, var_7763_cast_fp16))[name = tensor("op_8004_cast_fp16")]; + tensor var_8005_to_fp16 = const()[name = tensor("op_8005_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_543_cast_fp16 = mul(x = var_8004_cast_fp16, y = var_8005_to_fp16)[name = tensor("aw_543_cast_fp16")]; + tensor var_8008_equation_0 = const()[name = tensor("op_8008_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8008_cast_fp16 = einsum(equation = var_8008_equation_0, values = (var_7850_cast_fp16, var_7767_cast_fp16))[name = tensor("op_8008_cast_fp16")]; + tensor var_8009_to_fp16 = const()[name = tensor("op_8009_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_545_cast_fp16 = mul(x = var_8008_cast_fp16, y = var_8009_to_fp16)[name = tensor("aw_545_cast_fp16")]; + tensor var_8012_equation_0 = const()[name = tensor("op_8012_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8012_cast_fp16 = einsum(equation = var_8012_equation_0, values = (var_7854_cast_fp16, var_7771_cast_fp16))[name = tensor("op_8012_cast_fp16")]; + tensor var_8013_to_fp16 = const()[name = tensor("op_8013_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_547_cast_fp16 = mul(x = var_8012_cast_fp16, y = var_8013_to_fp16)[name = tensor("aw_547_cast_fp16")]; + tensor var_8016_equation_0 = const()[name = tensor("op_8016_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8016_cast_fp16 = einsum(equation = var_8016_equation_0, values = (var_7858_cast_fp16, var_7775_cast_fp16))[name = tensor("op_8016_cast_fp16")]; + tensor var_8017_to_fp16 = const()[name = tensor("op_8017_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_549_cast_fp16 = mul(x = var_8016_cast_fp16, y = var_8017_to_fp16)[name = tensor("aw_549_cast_fp16")]; + tensor var_8020_equation_0 = const()[name = tensor("op_8020_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8020_cast_fp16 = einsum(equation = var_8020_equation_0, values = (var_7862_cast_fp16, var_7779_cast_fp16))[name = tensor("op_8020_cast_fp16")]; + tensor var_8021_to_fp16 = const()[name = tensor("op_8021_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_551_cast_fp16 = mul(x = var_8020_cast_fp16, y = var_8021_to_fp16)[name = tensor("aw_551_cast_fp16")]; + tensor var_8024_equation_0 = const()[name = tensor("op_8024_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8024_cast_fp16 = einsum(equation = var_8024_equation_0, values = (var_7866_cast_fp16, var_7783_cast_fp16))[name = tensor("op_8024_cast_fp16")]; + tensor var_8025_to_fp16 = const()[name = tensor("op_8025_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_553_cast_fp16 = mul(x = var_8024_cast_fp16, y = var_8025_to_fp16)[name = tensor("aw_553_cast_fp16")]; + tensor var_8028_equation_0 = const()[name = tensor("op_8028_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8028_cast_fp16 = einsum(equation = var_8028_equation_0, values = (var_7870_cast_fp16, var_7787_cast_fp16))[name = tensor("op_8028_cast_fp16")]; + tensor var_8029_to_fp16 = const()[name = tensor("op_8029_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_555_cast_fp16 = mul(x = var_8028_cast_fp16, y = var_8029_to_fp16)[name = tensor("aw_555_cast_fp16")]; + tensor var_8032_equation_0 = const()[name = tensor("op_8032_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8032_cast_fp16 = einsum(equation = var_8032_equation_0, values = (var_7874_cast_fp16, var_7791_cast_fp16))[name = tensor("op_8032_cast_fp16")]; + tensor var_8033_to_fp16 = const()[name = tensor("op_8033_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_557_cast_fp16 = mul(x = var_8032_cast_fp16, y = var_8033_to_fp16)[name = tensor("aw_557_cast_fp16")]; + tensor var_8036_equation_0 = const()[name = tensor("op_8036_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8036_cast_fp16 = einsum(equation = var_8036_equation_0, values = (var_7878_cast_fp16, var_7795_cast_fp16))[name = tensor("op_8036_cast_fp16")]; + tensor var_8037_to_fp16 = const()[name = tensor("op_8037_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_559_cast_fp16 = mul(x = var_8036_cast_fp16, y = var_8037_to_fp16)[name = tensor("aw_559_cast_fp16")]; + tensor var_8039_cast_fp16 = softmax(axis = var_5599, x = aw_521_cast_fp16)[name = tensor("op_8039_cast_fp16")]; + tensor var_8040_cast_fp16 = softmax(axis = var_5599, x = aw_523_cast_fp16)[name = tensor("op_8040_cast_fp16")]; + tensor var_8041_cast_fp16 = softmax(axis = var_5599, x = aw_525_cast_fp16)[name = tensor("op_8041_cast_fp16")]; + tensor var_8042_cast_fp16 = softmax(axis = var_5599, x = aw_527_cast_fp16)[name = tensor("op_8042_cast_fp16")]; + tensor var_8043_cast_fp16 = softmax(axis = var_5599, x = aw_529_cast_fp16)[name = tensor("op_8043_cast_fp16")]; + tensor var_8044_cast_fp16 = softmax(axis = var_5599, x = aw_531_cast_fp16)[name = tensor("op_8044_cast_fp16")]; + tensor var_8045_cast_fp16 = softmax(axis = var_5599, x = aw_533_cast_fp16)[name = tensor("op_8045_cast_fp16")]; + tensor var_8046_cast_fp16 = softmax(axis = var_5599, x = aw_535_cast_fp16)[name = tensor("op_8046_cast_fp16")]; + tensor var_8047_cast_fp16 = softmax(axis = var_5599, x = aw_537_cast_fp16)[name = tensor("op_8047_cast_fp16")]; + tensor var_8048_cast_fp16 = softmax(axis = var_5599, x = aw_539_cast_fp16)[name = tensor("op_8048_cast_fp16")]; + tensor var_8049_cast_fp16 = softmax(axis = var_5599, x = aw_541_cast_fp16)[name = tensor("op_8049_cast_fp16")]; + tensor var_8050_cast_fp16 = softmax(axis = var_5599, x = aw_543_cast_fp16)[name = tensor("op_8050_cast_fp16")]; + tensor var_8051_cast_fp16 = softmax(axis = var_5599, x = aw_545_cast_fp16)[name = tensor("op_8051_cast_fp16")]; + tensor var_8052_cast_fp16 = softmax(axis = var_5599, x = aw_547_cast_fp16)[name = tensor("op_8052_cast_fp16")]; + tensor var_8053_cast_fp16 = softmax(axis = var_5599, x = aw_549_cast_fp16)[name = tensor("op_8053_cast_fp16")]; + tensor var_8054_cast_fp16 = softmax(axis = var_5599, x = aw_551_cast_fp16)[name = tensor("op_8054_cast_fp16")]; + tensor var_8055_cast_fp16 = softmax(axis = var_5599, x = aw_553_cast_fp16)[name = tensor("op_8055_cast_fp16")]; + tensor var_8056_cast_fp16 = softmax(axis = var_5599, x = aw_555_cast_fp16)[name = tensor("op_8056_cast_fp16")]; + tensor var_8057_cast_fp16 = softmax(axis = var_5599, x = aw_557_cast_fp16)[name = tensor("op_8057_cast_fp16")]; + tensor var_8058_cast_fp16 = softmax(axis = var_5599, x = aw_559_cast_fp16)[name = tensor("op_8058_cast_fp16")]; + tensor var_8060_equation_0 = const()[name = tensor("op_8060_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8060_cast_fp16 = einsum(equation = var_8060_equation_0, values = (var_7880_cast_fp16, var_8039_cast_fp16))[name = tensor("op_8060_cast_fp16")]; + tensor var_8062_equation_0 = const()[name = tensor("op_8062_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8062_cast_fp16 = einsum(equation = var_8062_equation_0, values = (var_7884_cast_fp16, var_8040_cast_fp16))[name = tensor("op_8062_cast_fp16")]; + tensor var_8064_equation_0 = const()[name = tensor("op_8064_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8064_cast_fp16 = einsum(equation = var_8064_equation_0, values = (var_7888_cast_fp16, var_8041_cast_fp16))[name = tensor("op_8064_cast_fp16")]; + tensor var_8066_equation_0 = const()[name = tensor("op_8066_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8066_cast_fp16 = einsum(equation = var_8066_equation_0, values = (var_7892_cast_fp16, var_8042_cast_fp16))[name = tensor("op_8066_cast_fp16")]; + tensor var_8068_equation_0 = const()[name = tensor("op_8068_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8068_cast_fp16 = einsum(equation = var_8068_equation_0, values = (var_7896_cast_fp16, var_8043_cast_fp16))[name = tensor("op_8068_cast_fp16")]; + tensor var_8070_equation_0 = const()[name = tensor("op_8070_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8070_cast_fp16 = einsum(equation = var_8070_equation_0, values = (var_7900_cast_fp16, var_8044_cast_fp16))[name = tensor("op_8070_cast_fp16")]; + tensor var_8072_equation_0 = const()[name = tensor("op_8072_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8072_cast_fp16 = einsum(equation = var_8072_equation_0, values = (var_7904_cast_fp16, var_8045_cast_fp16))[name = tensor("op_8072_cast_fp16")]; + tensor var_8074_equation_0 = const()[name = tensor("op_8074_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8074_cast_fp16 = einsum(equation = var_8074_equation_0, values = (var_7908_cast_fp16, var_8046_cast_fp16))[name = tensor("op_8074_cast_fp16")]; + tensor var_8076_equation_0 = const()[name = tensor("op_8076_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8076_cast_fp16 = einsum(equation = var_8076_equation_0, values = (var_7912_cast_fp16, var_8047_cast_fp16))[name = tensor("op_8076_cast_fp16")]; + tensor var_8078_equation_0 = const()[name = tensor("op_8078_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8078_cast_fp16 = einsum(equation = var_8078_equation_0, values = (var_7916_cast_fp16, var_8048_cast_fp16))[name = tensor("op_8078_cast_fp16")]; + tensor var_8080_equation_0 = const()[name = tensor("op_8080_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8080_cast_fp16 = einsum(equation = var_8080_equation_0, values = (var_7920_cast_fp16, var_8049_cast_fp16))[name = tensor("op_8080_cast_fp16")]; + tensor var_8082_equation_0 = const()[name = tensor("op_8082_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8082_cast_fp16 = einsum(equation = var_8082_equation_0, values = (var_7924_cast_fp16, var_8050_cast_fp16))[name = tensor("op_8082_cast_fp16")]; + tensor var_8084_equation_0 = const()[name = tensor("op_8084_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8084_cast_fp16 = einsum(equation = var_8084_equation_0, values = (var_7928_cast_fp16, var_8051_cast_fp16))[name = tensor("op_8084_cast_fp16")]; + tensor var_8086_equation_0 = const()[name = tensor("op_8086_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8086_cast_fp16 = einsum(equation = var_8086_equation_0, values = (var_7932_cast_fp16, var_8052_cast_fp16))[name = tensor("op_8086_cast_fp16")]; + tensor var_8088_equation_0 = const()[name = tensor("op_8088_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8088_cast_fp16 = einsum(equation = var_8088_equation_0, values = (var_7936_cast_fp16, var_8053_cast_fp16))[name = tensor("op_8088_cast_fp16")]; + tensor var_8090_equation_0 = const()[name = tensor("op_8090_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8090_cast_fp16 = einsum(equation = var_8090_equation_0, values = (var_7940_cast_fp16, var_8054_cast_fp16))[name = tensor("op_8090_cast_fp16")]; + tensor var_8092_equation_0 = const()[name = tensor("op_8092_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8092_cast_fp16 = einsum(equation = var_8092_equation_0, values = (var_7944_cast_fp16, var_8055_cast_fp16))[name = tensor("op_8092_cast_fp16")]; + tensor var_8094_equation_0 = const()[name = tensor("op_8094_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8094_cast_fp16 = einsum(equation = var_8094_equation_0, values = (var_7948_cast_fp16, var_8056_cast_fp16))[name = tensor("op_8094_cast_fp16")]; + tensor var_8096_equation_0 = const()[name = tensor("op_8096_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8096_cast_fp16 = einsum(equation = var_8096_equation_0, values = (var_7952_cast_fp16, var_8057_cast_fp16))[name = tensor("op_8096_cast_fp16")]; + tensor var_8098_equation_0 = const()[name = tensor("op_8098_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8098_cast_fp16 = einsum(equation = var_8098_equation_0, values = (var_7956_cast_fp16, var_8058_cast_fp16))[name = tensor("op_8098_cast_fp16")]; + tensor input_353_interleave_0 = const()[name = tensor("input_353_interleave_0"), val = tensor(false)]; + tensor input_353_cast_fp16 = concat(axis = var_5599, interleave = input_353_interleave_0, values = (var_8060_cast_fp16, var_8062_cast_fp16, var_8064_cast_fp16, var_8066_cast_fp16, var_8068_cast_fp16, var_8070_cast_fp16, var_8072_cast_fp16, var_8074_cast_fp16, var_8076_cast_fp16, var_8078_cast_fp16, var_8080_cast_fp16, var_8082_cast_fp16, var_8084_cast_fp16, var_8086_cast_fp16, var_8088_cast_fp16, var_8090_cast_fp16, var_8092_cast_fp16, var_8094_cast_fp16, var_8096_cast_fp16, var_8098_cast_fp16))[name = tensor("input_353_cast_fp16")]; + tensor var_8104 = const()[name = tensor("op_8104"), val = tensor([1, 1])]; + tensor var_8106 = const()[name = tensor("op_8106"), val = tensor([1, 1])]; + tensor var_8108_pad_type_0 = const()[name = tensor("op_8108_pad_type_0"), val = tensor("custom")]; + tensor var_8108_pad_0 = const()[name = tensor("op_8108_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1461249920)))]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1464526784)))]; + tensor var_8108_cast_fp16 = conv(bias = up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_8106, groups = var_5599, pad = var_8108_pad_0, pad_type = var_8108_pad_type_0, strides = var_8104, weight = up_blocks_1_attentions_2_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_353_cast_fp16)[name = tensor("op_8108_cast_fp16")]; + tensor inputs_57_cast_fp16 = add(x = var_8108_cast_fp16, y = inputs_55_cast_fp16)[name = tensor("inputs_57_cast_fp16")]; + tensor var_8112 = const()[name = tensor("op_8112"), val = tensor([1])]; + tensor channels_mean_57_cast_fp16 = reduce_mean(axes = var_8112, keep_dims = var_5594, x = inputs_57_cast_fp16)[name = tensor("channels_mean_57_cast_fp16")]; + tensor zero_mean_57_cast_fp16 = sub(x = inputs_57_cast_fp16, y = channels_mean_57_cast_fp16)[name = tensor("zero_mean_57_cast_fp16")]; + tensor zero_mean_sq_57_cast_fp16 = mul(x = zero_mean_57_cast_fp16, y = zero_mean_57_cast_fp16)[name = tensor("zero_mean_sq_57_cast_fp16")]; + tensor var_8116 = const()[name = tensor("op_8116"), val = tensor([1])]; + tensor var_8117_cast_fp16 = reduce_mean(axes = var_8116, keep_dims = var_5594, x = zero_mean_sq_57_cast_fp16)[name = tensor("op_8117_cast_fp16")]; + tensor var_8118_to_fp16 = const()[name = tensor("op_8118_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_8119_cast_fp16 = add(x = var_8117_cast_fp16, y = var_8118_to_fp16)[name = tensor("op_8119_cast_fp16")]; + tensor denom_57_epsilon_0_to_fp16 = const()[name = tensor("denom_57_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_57_cast_fp16 = rsqrt(epsilon = denom_57_epsilon_0_to_fp16, x = var_8119_cast_fp16)[name = tensor("denom_57_cast_fp16")]; + tensor out_57_cast_fp16 = mul(x = zero_mean_57_cast_fp16, y = denom_57_cast_fp16)[name = tensor("out_57_cast_fp16")]; + tensor var_8123_to_fp16 = const()[name = tensor("op_8123_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1464529408)))]; + tensor var_8124_cast_fp16 = add(x = out_57_cast_fp16, y = var_8123_to_fp16)[name = tensor("op_8124_cast_fp16")]; + tensor var_8126_to_fp16 = const()[name = tensor("op_8126_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1464532032)))]; + tensor hidden_states_209_cast_fp16 = mul(x = var_8124_cast_fp16, y = var_8126_to_fp16)[name = tensor("hidden_states_209_cast_fp16")]; + tensor var_8133 = const()[name = tensor("op_8133"), val = tensor([1, 1])]; + tensor var_8135 = const()[name = tensor("op_8135"), val = tensor([1, 1])]; + tensor q_39_pad_type_0 = const()[name = tensor("q_39_pad_type_0"), val = tensor("custom")]; + tensor q_39_pad_0 = const()[name = tensor("q_39_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1464534656)))]; + tensor q_39_cast_fp16 = conv(dilations = var_8135, groups = var_5599, pad = q_39_pad_0, pad_type = q_39_pad_type_0, strides = var_8133, weight = up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_209_cast_fp16)[name = tensor("q_39_cast_fp16")]; + tensor var_8139 = const()[name = tensor("op_8139"), val = tensor([1, 1])]; + tensor var_8141 = const()[name = tensor("op_8141"), val = tensor([1, 1])]; + tensor k_77_pad_type_0 = const()[name = tensor("k_77_pad_type_0"), val = tensor("custom")]; + tensor k_77_pad_0 = const()[name = tensor("k_77_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1467811520)))]; + tensor k_77_cast_fp16 = conv(dilations = var_8141, groups = var_5599, pad = k_77_pad_0, pad_type = k_77_pad_type_0, strides = var_8139, weight = up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_77_cast_fp16")]; + tensor var_8145 = const()[name = tensor("op_8145"), val = tensor([1, 1])]; + tensor var_8147 = const()[name = tensor("op_8147"), val = tensor([1, 1])]; + tensor v_39_pad_type_0 = const()[name = tensor("v_39_pad_type_0"), val = tensor("custom")]; + tensor v_39_pad_0 = const()[name = tensor("v_39_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1470433024)))]; + tensor v_39_cast_fp16 = conv(dilations = var_8147, groups = var_5599, pad = v_39_pad_0, pad_type = v_39_pad_type_0, strides = var_8145, weight = up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_39_cast_fp16")]; + tensor var_8151_begin_0 = const()[name = tensor("op_8151_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_8151_end_0 = const()[name = tensor("op_8151_end_0"), val = tensor([2, 64, 1, 144])]; + tensor var_8151_end_mask_0 = const()[name = tensor("op_8151_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8151_cast_fp16 = slice_by_index(begin = var_8151_begin_0, end = var_8151_end_0, end_mask = var_8151_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8151_cast_fp16")]; + tensor var_8155_begin_0 = const()[name = tensor("op_8155_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_8155_end_0 = const()[name = tensor("op_8155_end_0"), val = tensor([2, 128, 1, 144])]; + tensor var_8155_end_mask_0 = const()[name = tensor("op_8155_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8155_cast_fp16 = slice_by_index(begin = var_8155_begin_0, end = var_8155_end_0, end_mask = var_8155_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8155_cast_fp16")]; + tensor var_8159_begin_0 = const()[name = tensor("op_8159_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_8159_end_0 = const()[name = tensor("op_8159_end_0"), val = tensor([2, 192, 1, 144])]; + tensor var_8159_end_mask_0 = const()[name = tensor("op_8159_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8159_cast_fp16 = slice_by_index(begin = var_8159_begin_0, end = var_8159_end_0, end_mask = var_8159_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8159_cast_fp16")]; + tensor var_8163_begin_0 = const()[name = tensor("op_8163_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_8163_end_0 = const()[name = tensor("op_8163_end_0"), val = tensor([2, 256, 1, 144])]; + tensor var_8163_end_mask_0 = const()[name = tensor("op_8163_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8163_cast_fp16 = slice_by_index(begin = var_8163_begin_0, end = var_8163_end_0, end_mask = var_8163_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8163_cast_fp16")]; + tensor var_8167_begin_0 = const()[name = tensor("op_8167_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_8167_end_0 = const()[name = tensor("op_8167_end_0"), val = tensor([2, 320, 1, 144])]; + tensor var_8167_end_mask_0 = const()[name = tensor("op_8167_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8167_cast_fp16 = slice_by_index(begin = var_8167_begin_0, end = var_8167_end_0, end_mask = var_8167_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8167_cast_fp16")]; + tensor var_8171_begin_0 = const()[name = tensor("op_8171_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_8171_end_0 = const()[name = tensor("op_8171_end_0"), val = tensor([2, 384, 1, 144])]; + tensor var_8171_end_mask_0 = const()[name = tensor("op_8171_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8171_cast_fp16 = slice_by_index(begin = var_8171_begin_0, end = var_8171_end_0, end_mask = var_8171_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8171_cast_fp16")]; + tensor var_8175_begin_0 = const()[name = tensor("op_8175_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_8175_end_0 = const()[name = tensor("op_8175_end_0"), val = tensor([2, 448, 1, 144])]; + tensor var_8175_end_mask_0 = const()[name = tensor("op_8175_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8175_cast_fp16 = slice_by_index(begin = var_8175_begin_0, end = var_8175_end_0, end_mask = var_8175_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8175_cast_fp16")]; + tensor var_8179_begin_0 = const()[name = tensor("op_8179_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_8179_end_0 = const()[name = tensor("op_8179_end_0"), val = tensor([2, 512, 1, 144])]; + tensor var_8179_end_mask_0 = const()[name = tensor("op_8179_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8179_cast_fp16 = slice_by_index(begin = var_8179_begin_0, end = var_8179_end_0, end_mask = var_8179_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8179_cast_fp16")]; + tensor var_8183_begin_0 = const()[name = tensor("op_8183_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_8183_end_0 = const()[name = tensor("op_8183_end_0"), val = tensor([2, 576, 1, 144])]; + tensor var_8183_end_mask_0 = const()[name = tensor("op_8183_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8183_cast_fp16 = slice_by_index(begin = var_8183_begin_0, end = var_8183_end_0, end_mask = var_8183_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8183_cast_fp16")]; + tensor var_8187_begin_0 = const()[name = tensor("op_8187_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_8187_end_0 = const()[name = tensor("op_8187_end_0"), val = tensor([2, 640, 1, 144])]; + tensor var_8187_end_mask_0 = const()[name = tensor("op_8187_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8187_cast_fp16 = slice_by_index(begin = var_8187_begin_0, end = var_8187_end_0, end_mask = var_8187_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8187_cast_fp16")]; + tensor var_8191_begin_0 = const()[name = tensor("op_8191_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_8191_end_0 = const()[name = tensor("op_8191_end_0"), val = tensor([2, 704, 1, 144])]; + tensor var_8191_end_mask_0 = const()[name = tensor("op_8191_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8191_cast_fp16 = slice_by_index(begin = var_8191_begin_0, end = var_8191_end_0, end_mask = var_8191_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8191_cast_fp16")]; + tensor var_8195_begin_0 = const()[name = tensor("op_8195_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_8195_end_0 = const()[name = tensor("op_8195_end_0"), val = tensor([2, 768, 1, 144])]; + tensor var_8195_end_mask_0 = const()[name = tensor("op_8195_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8195_cast_fp16 = slice_by_index(begin = var_8195_begin_0, end = var_8195_end_0, end_mask = var_8195_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8195_cast_fp16")]; + tensor var_8199_begin_0 = const()[name = tensor("op_8199_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_8199_end_0 = const()[name = tensor("op_8199_end_0"), val = tensor([2, 832, 1, 144])]; + tensor var_8199_end_mask_0 = const()[name = tensor("op_8199_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8199_cast_fp16 = slice_by_index(begin = var_8199_begin_0, end = var_8199_end_0, end_mask = var_8199_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8199_cast_fp16")]; + tensor var_8203_begin_0 = const()[name = tensor("op_8203_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_8203_end_0 = const()[name = tensor("op_8203_end_0"), val = tensor([2, 896, 1, 144])]; + tensor var_8203_end_mask_0 = const()[name = tensor("op_8203_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8203_cast_fp16 = slice_by_index(begin = var_8203_begin_0, end = var_8203_end_0, end_mask = var_8203_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8203_cast_fp16")]; + tensor var_8207_begin_0 = const()[name = tensor("op_8207_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_8207_end_0 = const()[name = tensor("op_8207_end_0"), val = tensor([2, 960, 1, 144])]; + tensor var_8207_end_mask_0 = const()[name = tensor("op_8207_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8207_cast_fp16 = slice_by_index(begin = var_8207_begin_0, end = var_8207_end_0, end_mask = var_8207_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8207_cast_fp16")]; + tensor var_8211_begin_0 = const()[name = tensor("op_8211_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_8211_end_0 = const()[name = tensor("op_8211_end_0"), val = tensor([2, 1024, 1, 144])]; + tensor var_8211_end_mask_0 = const()[name = tensor("op_8211_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8211_cast_fp16 = slice_by_index(begin = var_8211_begin_0, end = var_8211_end_0, end_mask = var_8211_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8211_cast_fp16")]; + tensor var_8215_begin_0 = const()[name = tensor("op_8215_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_8215_end_0 = const()[name = tensor("op_8215_end_0"), val = tensor([2, 1088, 1, 144])]; + tensor var_8215_end_mask_0 = const()[name = tensor("op_8215_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8215_cast_fp16 = slice_by_index(begin = var_8215_begin_0, end = var_8215_end_0, end_mask = var_8215_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8215_cast_fp16")]; + tensor var_8219_begin_0 = const()[name = tensor("op_8219_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_8219_end_0 = const()[name = tensor("op_8219_end_0"), val = tensor([2, 1152, 1, 144])]; + tensor var_8219_end_mask_0 = const()[name = tensor("op_8219_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8219_cast_fp16 = slice_by_index(begin = var_8219_begin_0, end = var_8219_end_0, end_mask = var_8219_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8219_cast_fp16")]; + tensor var_8223_begin_0 = const()[name = tensor("op_8223_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_8223_end_0 = const()[name = tensor("op_8223_end_0"), val = tensor([2, 1216, 1, 144])]; + tensor var_8223_end_mask_0 = const()[name = tensor("op_8223_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8223_cast_fp16 = slice_by_index(begin = var_8223_begin_0, end = var_8223_end_0, end_mask = var_8223_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8223_cast_fp16")]; + tensor var_8227_begin_0 = const()[name = tensor("op_8227_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_8227_end_0 = const()[name = tensor("op_8227_end_0"), val = tensor([2, 1280, 1, 144])]; + tensor var_8227_end_mask_0 = const()[name = tensor("op_8227_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8227_cast_fp16 = slice_by_index(begin = var_8227_begin_0, end = var_8227_end_0, end_mask = var_8227_end_mask_0, x = q_39_cast_fp16)[name = tensor("op_8227_cast_fp16")]; + tensor k_79_perm_0 = const()[name = tensor("k_79_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_8234_begin_0 = const()[name = tensor("op_8234_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_8234_end_0 = const()[name = tensor("op_8234_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_8234_end_mask_0 = const()[name = tensor("op_8234_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_12 = transpose(perm = k_79_perm_0, x = k_77_cast_fp16)[name = tensor("transpose_12")]; + tensor var_8234_cast_fp16 = slice_by_index(begin = var_8234_begin_0, end = var_8234_end_0, end_mask = var_8234_end_mask_0, x = transpose_12)[name = tensor("op_8234_cast_fp16")]; + tensor var_8238_begin_0 = const()[name = tensor("op_8238_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_8238_end_0 = const()[name = tensor("op_8238_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_8238_end_mask_0 = const()[name = tensor("op_8238_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8238_cast_fp16 = slice_by_index(begin = var_8238_begin_0, end = var_8238_end_0, end_mask = var_8238_end_mask_0, x = transpose_12)[name = tensor("op_8238_cast_fp16")]; + tensor var_8242_begin_0 = const()[name = tensor("op_8242_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_8242_end_0 = const()[name = tensor("op_8242_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_8242_end_mask_0 = const()[name = tensor("op_8242_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8242_cast_fp16 = slice_by_index(begin = var_8242_begin_0, end = var_8242_end_0, end_mask = var_8242_end_mask_0, x = transpose_12)[name = tensor("op_8242_cast_fp16")]; + tensor var_8246_begin_0 = const()[name = tensor("op_8246_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_8246_end_0 = const()[name = tensor("op_8246_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_8246_end_mask_0 = const()[name = tensor("op_8246_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8246_cast_fp16 = slice_by_index(begin = var_8246_begin_0, end = var_8246_end_0, end_mask = var_8246_end_mask_0, x = transpose_12)[name = tensor("op_8246_cast_fp16")]; + tensor var_8250_begin_0 = const()[name = tensor("op_8250_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_8250_end_0 = const()[name = tensor("op_8250_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_8250_end_mask_0 = const()[name = tensor("op_8250_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8250_cast_fp16 = slice_by_index(begin = var_8250_begin_0, end = var_8250_end_0, end_mask = var_8250_end_mask_0, x = transpose_12)[name = tensor("op_8250_cast_fp16")]; + tensor var_8254_begin_0 = const()[name = tensor("op_8254_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_8254_end_0 = const()[name = tensor("op_8254_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_8254_end_mask_0 = const()[name = tensor("op_8254_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8254_cast_fp16 = slice_by_index(begin = var_8254_begin_0, end = var_8254_end_0, end_mask = var_8254_end_mask_0, x = transpose_12)[name = tensor("op_8254_cast_fp16")]; + tensor var_8258_begin_0 = const()[name = tensor("op_8258_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_8258_end_0 = const()[name = tensor("op_8258_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_8258_end_mask_0 = const()[name = tensor("op_8258_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8258_cast_fp16 = slice_by_index(begin = var_8258_begin_0, end = var_8258_end_0, end_mask = var_8258_end_mask_0, x = transpose_12)[name = tensor("op_8258_cast_fp16")]; + tensor var_8262_begin_0 = const()[name = tensor("op_8262_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_8262_end_0 = const()[name = tensor("op_8262_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_8262_end_mask_0 = const()[name = tensor("op_8262_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8262_cast_fp16 = slice_by_index(begin = var_8262_begin_0, end = var_8262_end_0, end_mask = var_8262_end_mask_0, x = transpose_12)[name = tensor("op_8262_cast_fp16")]; + tensor var_8266_begin_0 = const()[name = tensor("op_8266_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_8266_end_0 = const()[name = tensor("op_8266_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_8266_end_mask_0 = const()[name = tensor("op_8266_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8266_cast_fp16 = slice_by_index(begin = var_8266_begin_0, end = var_8266_end_0, end_mask = var_8266_end_mask_0, x = transpose_12)[name = tensor("op_8266_cast_fp16")]; + tensor var_8270_begin_0 = const()[name = tensor("op_8270_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_8270_end_0 = const()[name = tensor("op_8270_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_8270_end_mask_0 = const()[name = tensor("op_8270_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8270_cast_fp16 = slice_by_index(begin = var_8270_begin_0, end = var_8270_end_0, end_mask = var_8270_end_mask_0, x = transpose_12)[name = tensor("op_8270_cast_fp16")]; + tensor var_8274_begin_0 = const()[name = tensor("op_8274_begin_0"), val = tensor([0, 0, 0, 640])]; + tensor var_8274_end_0 = const()[name = tensor("op_8274_end_0"), val = tensor([2, 77, 1, 704])]; + tensor var_8274_end_mask_0 = const()[name = tensor("op_8274_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8274_cast_fp16 = slice_by_index(begin = var_8274_begin_0, end = var_8274_end_0, end_mask = var_8274_end_mask_0, x = transpose_12)[name = tensor("op_8274_cast_fp16")]; + tensor var_8278_begin_0 = const()[name = tensor("op_8278_begin_0"), val = tensor([0, 0, 0, 704])]; + tensor var_8278_end_0 = const()[name = tensor("op_8278_end_0"), val = tensor([2, 77, 1, 768])]; + tensor var_8278_end_mask_0 = const()[name = tensor("op_8278_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8278_cast_fp16 = slice_by_index(begin = var_8278_begin_0, end = var_8278_end_0, end_mask = var_8278_end_mask_0, x = transpose_12)[name = tensor("op_8278_cast_fp16")]; + tensor var_8282_begin_0 = const()[name = tensor("op_8282_begin_0"), val = tensor([0, 0, 0, 768])]; + tensor var_8282_end_0 = const()[name = tensor("op_8282_end_0"), val = tensor([2, 77, 1, 832])]; + tensor var_8282_end_mask_0 = const()[name = tensor("op_8282_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8282_cast_fp16 = slice_by_index(begin = var_8282_begin_0, end = var_8282_end_0, end_mask = var_8282_end_mask_0, x = transpose_12)[name = tensor("op_8282_cast_fp16")]; + tensor var_8286_begin_0 = const()[name = tensor("op_8286_begin_0"), val = tensor([0, 0, 0, 832])]; + tensor var_8286_end_0 = const()[name = tensor("op_8286_end_0"), val = tensor([2, 77, 1, 896])]; + tensor var_8286_end_mask_0 = const()[name = tensor("op_8286_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8286_cast_fp16 = slice_by_index(begin = var_8286_begin_0, end = var_8286_end_0, end_mask = var_8286_end_mask_0, x = transpose_12)[name = tensor("op_8286_cast_fp16")]; + tensor var_8290_begin_0 = const()[name = tensor("op_8290_begin_0"), val = tensor([0, 0, 0, 896])]; + tensor var_8290_end_0 = const()[name = tensor("op_8290_end_0"), val = tensor([2, 77, 1, 960])]; + tensor var_8290_end_mask_0 = const()[name = tensor("op_8290_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8290_cast_fp16 = slice_by_index(begin = var_8290_begin_0, end = var_8290_end_0, end_mask = var_8290_end_mask_0, x = transpose_12)[name = tensor("op_8290_cast_fp16")]; + tensor var_8294_begin_0 = const()[name = tensor("op_8294_begin_0"), val = tensor([0, 0, 0, 960])]; + tensor var_8294_end_0 = const()[name = tensor("op_8294_end_0"), val = tensor([2, 77, 1, 1024])]; + tensor var_8294_end_mask_0 = const()[name = tensor("op_8294_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8294_cast_fp16 = slice_by_index(begin = var_8294_begin_0, end = var_8294_end_0, end_mask = var_8294_end_mask_0, x = transpose_12)[name = tensor("op_8294_cast_fp16")]; + tensor var_8298_begin_0 = const()[name = tensor("op_8298_begin_0"), val = tensor([0, 0, 0, 1024])]; + tensor var_8298_end_0 = const()[name = tensor("op_8298_end_0"), val = tensor([2, 77, 1, 1088])]; + tensor var_8298_end_mask_0 = const()[name = tensor("op_8298_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8298_cast_fp16 = slice_by_index(begin = var_8298_begin_0, end = var_8298_end_0, end_mask = var_8298_end_mask_0, x = transpose_12)[name = tensor("op_8298_cast_fp16")]; + tensor var_8302_begin_0 = const()[name = tensor("op_8302_begin_0"), val = tensor([0, 0, 0, 1088])]; + tensor var_8302_end_0 = const()[name = tensor("op_8302_end_0"), val = tensor([2, 77, 1, 1152])]; + tensor var_8302_end_mask_0 = const()[name = tensor("op_8302_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8302_cast_fp16 = slice_by_index(begin = var_8302_begin_0, end = var_8302_end_0, end_mask = var_8302_end_mask_0, x = transpose_12)[name = tensor("op_8302_cast_fp16")]; + tensor var_8306_begin_0 = const()[name = tensor("op_8306_begin_0"), val = tensor([0, 0, 0, 1152])]; + tensor var_8306_end_0 = const()[name = tensor("op_8306_end_0"), val = tensor([2, 77, 1, 1216])]; + tensor var_8306_end_mask_0 = const()[name = tensor("op_8306_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8306_cast_fp16 = slice_by_index(begin = var_8306_begin_0, end = var_8306_end_0, end_mask = var_8306_end_mask_0, x = transpose_12)[name = tensor("op_8306_cast_fp16")]; + tensor var_8310_begin_0 = const()[name = tensor("op_8310_begin_0"), val = tensor([0, 0, 0, 1216])]; + tensor var_8310_end_0 = const()[name = tensor("op_8310_end_0"), val = tensor([2, 77, 1, 1280])]; + tensor var_8310_end_mask_0 = const()[name = tensor("op_8310_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8310_cast_fp16 = slice_by_index(begin = var_8310_begin_0, end = var_8310_end_0, end_mask = var_8310_end_mask_0, x = transpose_12)[name = tensor("op_8310_cast_fp16")]; + tensor var_8312_begin_0 = const()[name = tensor("op_8312_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_8312_end_0 = const()[name = tensor("op_8312_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_8312_end_mask_0 = const()[name = tensor("op_8312_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8312_cast_fp16 = slice_by_index(begin = var_8312_begin_0, end = var_8312_end_0, end_mask = var_8312_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8312_cast_fp16")]; + tensor var_8316_begin_0 = const()[name = tensor("op_8316_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_8316_end_0 = const()[name = tensor("op_8316_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_8316_end_mask_0 = const()[name = tensor("op_8316_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8316_cast_fp16 = slice_by_index(begin = var_8316_begin_0, end = var_8316_end_0, end_mask = var_8316_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8316_cast_fp16")]; + tensor var_8320_begin_0 = const()[name = tensor("op_8320_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_8320_end_0 = const()[name = tensor("op_8320_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_8320_end_mask_0 = const()[name = tensor("op_8320_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8320_cast_fp16 = slice_by_index(begin = var_8320_begin_0, end = var_8320_end_0, end_mask = var_8320_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8320_cast_fp16")]; + tensor var_8324_begin_0 = const()[name = tensor("op_8324_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_8324_end_0 = const()[name = tensor("op_8324_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_8324_end_mask_0 = const()[name = tensor("op_8324_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8324_cast_fp16 = slice_by_index(begin = var_8324_begin_0, end = var_8324_end_0, end_mask = var_8324_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8324_cast_fp16")]; + tensor var_8328_begin_0 = const()[name = tensor("op_8328_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_8328_end_0 = const()[name = tensor("op_8328_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_8328_end_mask_0 = const()[name = tensor("op_8328_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8328_cast_fp16 = slice_by_index(begin = var_8328_begin_0, end = var_8328_end_0, end_mask = var_8328_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8328_cast_fp16")]; + tensor var_8332_begin_0 = const()[name = tensor("op_8332_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_8332_end_0 = const()[name = tensor("op_8332_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_8332_end_mask_0 = const()[name = tensor("op_8332_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8332_cast_fp16 = slice_by_index(begin = var_8332_begin_0, end = var_8332_end_0, end_mask = var_8332_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8332_cast_fp16")]; + tensor var_8336_begin_0 = const()[name = tensor("op_8336_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_8336_end_0 = const()[name = tensor("op_8336_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_8336_end_mask_0 = const()[name = tensor("op_8336_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8336_cast_fp16 = slice_by_index(begin = var_8336_begin_0, end = var_8336_end_0, end_mask = var_8336_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8336_cast_fp16")]; + tensor var_8340_begin_0 = const()[name = tensor("op_8340_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_8340_end_0 = const()[name = tensor("op_8340_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_8340_end_mask_0 = const()[name = tensor("op_8340_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8340_cast_fp16 = slice_by_index(begin = var_8340_begin_0, end = var_8340_end_0, end_mask = var_8340_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8340_cast_fp16")]; + tensor var_8344_begin_0 = const()[name = tensor("op_8344_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_8344_end_0 = const()[name = tensor("op_8344_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_8344_end_mask_0 = const()[name = tensor("op_8344_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8344_cast_fp16 = slice_by_index(begin = var_8344_begin_0, end = var_8344_end_0, end_mask = var_8344_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8344_cast_fp16")]; + tensor var_8348_begin_0 = const()[name = tensor("op_8348_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_8348_end_0 = const()[name = tensor("op_8348_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_8348_end_mask_0 = const()[name = tensor("op_8348_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8348_cast_fp16 = slice_by_index(begin = var_8348_begin_0, end = var_8348_end_0, end_mask = var_8348_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8348_cast_fp16")]; + tensor var_8352_begin_0 = const()[name = tensor("op_8352_begin_0"), val = tensor([0, 640, 0, 0])]; + tensor var_8352_end_0 = const()[name = tensor("op_8352_end_0"), val = tensor([2, 704, 1, 77])]; + tensor var_8352_end_mask_0 = const()[name = tensor("op_8352_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8352_cast_fp16 = slice_by_index(begin = var_8352_begin_0, end = var_8352_end_0, end_mask = var_8352_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8352_cast_fp16")]; + tensor var_8356_begin_0 = const()[name = tensor("op_8356_begin_0"), val = tensor([0, 704, 0, 0])]; + tensor var_8356_end_0 = const()[name = tensor("op_8356_end_0"), val = tensor([2, 768, 1, 77])]; + tensor var_8356_end_mask_0 = const()[name = tensor("op_8356_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8356_cast_fp16 = slice_by_index(begin = var_8356_begin_0, end = var_8356_end_0, end_mask = var_8356_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8356_cast_fp16")]; + tensor var_8360_begin_0 = const()[name = tensor("op_8360_begin_0"), val = tensor([0, 768, 0, 0])]; + tensor var_8360_end_0 = const()[name = tensor("op_8360_end_0"), val = tensor([2, 832, 1, 77])]; + tensor var_8360_end_mask_0 = const()[name = tensor("op_8360_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8360_cast_fp16 = slice_by_index(begin = var_8360_begin_0, end = var_8360_end_0, end_mask = var_8360_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8360_cast_fp16")]; + tensor var_8364_begin_0 = const()[name = tensor("op_8364_begin_0"), val = tensor([0, 832, 0, 0])]; + tensor var_8364_end_0 = const()[name = tensor("op_8364_end_0"), val = tensor([2, 896, 1, 77])]; + tensor var_8364_end_mask_0 = const()[name = tensor("op_8364_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8364_cast_fp16 = slice_by_index(begin = var_8364_begin_0, end = var_8364_end_0, end_mask = var_8364_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8364_cast_fp16")]; + tensor var_8368_begin_0 = const()[name = tensor("op_8368_begin_0"), val = tensor([0, 896, 0, 0])]; + tensor var_8368_end_0 = const()[name = tensor("op_8368_end_0"), val = tensor([2, 960, 1, 77])]; + tensor var_8368_end_mask_0 = const()[name = tensor("op_8368_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8368_cast_fp16 = slice_by_index(begin = var_8368_begin_0, end = var_8368_end_0, end_mask = var_8368_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8368_cast_fp16")]; + tensor var_8372_begin_0 = const()[name = tensor("op_8372_begin_0"), val = tensor([0, 960, 0, 0])]; + tensor var_8372_end_0 = const()[name = tensor("op_8372_end_0"), val = tensor([2, 1024, 1, 77])]; + tensor var_8372_end_mask_0 = const()[name = tensor("op_8372_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8372_cast_fp16 = slice_by_index(begin = var_8372_begin_0, end = var_8372_end_0, end_mask = var_8372_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8372_cast_fp16")]; + tensor var_8376_begin_0 = const()[name = tensor("op_8376_begin_0"), val = tensor([0, 1024, 0, 0])]; + tensor var_8376_end_0 = const()[name = tensor("op_8376_end_0"), val = tensor([2, 1088, 1, 77])]; + tensor var_8376_end_mask_0 = const()[name = tensor("op_8376_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8376_cast_fp16 = slice_by_index(begin = var_8376_begin_0, end = var_8376_end_0, end_mask = var_8376_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8376_cast_fp16")]; + tensor var_8380_begin_0 = const()[name = tensor("op_8380_begin_0"), val = tensor([0, 1088, 0, 0])]; + tensor var_8380_end_0 = const()[name = tensor("op_8380_end_0"), val = tensor([2, 1152, 1, 77])]; + tensor var_8380_end_mask_0 = const()[name = tensor("op_8380_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8380_cast_fp16 = slice_by_index(begin = var_8380_begin_0, end = var_8380_end_0, end_mask = var_8380_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8380_cast_fp16")]; + tensor var_8384_begin_0 = const()[name = tensor("op_8384_begin_0"), val = tensor([0, 1152, 0, 0])]; + tensor var_8384_end_0 = const()[name = tensor("op_8384_end_0"), val = tensor([2, 1216, 1, 77])]; + tensor var_8384_end_mask_0 = const()[name = tensor("op_8384_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8384_cast_fp16 = slice_by_index(begin = var_8384_begin_0, end = var_8384_end_0, end_mask = var_8384_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8384_cast_fp16")]; + tensor var_8388_begin_0 = const()[name = tensor("op_8388_begin_0"), val = tensor([0, 1216, 0, 0])]; + tensor var_8388_end_0 = const()[name = tensor("op_8388_end_0"), val = tensor([2, 1280, 1, 77])]; + tensor var_8388_end_mask_0 = const()[name = tensor("op_8388_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8388_cast_fp16 = slice_by_index(begin = var_8388_begin_0, end = var_8388_end_0, end_mask = var_8388_end_mask_0, x = v_39_cast_fp16)[name = tensor("op_8388_cast_fp16")]; + tensor var_8392_equation_0 = const()[name = tensor("op_8392_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8392_cast_fp16 = einsum(equation = var_8392_equation_0, values = (var_8234_cast_fp16, var_8151_cast_fp16))[name = tensor("op_8392_cast_fp16")]; + tensor var_8393_to_fp16 = const()[name = tensor("op_8393_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_561_cast_fp16 = mul(x = var_8392_cast_fp16, y = var_8393_to_fp16)[name = tensor("aw_561_cast_fp16")]; + tensor var_8396_equation_0 = const()[name = tensor("op_8396_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8396_cast_fp16 = einsum(equation = var_8396_equation_0, values = (var_8238_cast_fp16, var_8155_cast_fp16))[name = tensor("op_8396_cast_fp16")]; + tensor var_8397_to_fp16 = const()[name = tensor("op_8397_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_563_cast_fp16 = mul(x = var_8396_cast_fp16, y = var_8397_to_fp16)[name = tensor("aw_563_cast_fp16")]; + tensor var_8400_equation_0 = const()[name = tensor("op_8400_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8400_cast_fp16 = einsum(equation = var_8400_equation_0, values = (var_8242_cast_fp16, var_8159_cast_fp16))[name = tensor("op_8400_cast_fp16")]; + tensor var_8401_to_fp16 = const()[name = tensor("op_8401_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_565_cast_fp16 = mul(x = var_8400_cast_fp16, y = var_8401_to_fp16)[name = tensor("aw_565_cast_fp16")]; + tensor var_8404_equation_0 = const()[name = tensor("op_8404_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8404_cast_fp16 = einsum(equation = var_8404_equation_0, values = (var_8246_cast_fp16, var_8163_cast_fp16))[name = tensor("op_8404_cast_fp16")]; + tensor var_8405_to_fp16 = const()[name = tensor("op_8405_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_567_cast_fp16 = mul(x = var_8404_cast_fp16, y = var_8405_to_fp16)[name = tensor("aw_567_cast_fp16")]; + tensor var_8408_equation_0 = const()[name = tensor("op_8408_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8408_cast_fp16 = einsum(equation = var_8408_equation_0, values = (var_8250_cast_fp16, var_8167_cast_fp16))[name = tensor("op_8408_cast_fp16")]; + tensor var_8409_to_fp16 = const()[name = tensor("op_8409_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_569_cast_fp16 = mul(x = var_8408_cast_fp16, y = var_8409_to_fp16)[name = tensor("aw_569_cast_fp16")]; + tensor var_8412_equation_0 = const()[name = tensor("op_8412_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8412_cast_fp16 = einsum(equation = var_8412_equation_0, values = (var_8254_cast_fp16, var_8171_cast_fp16))[name = tensor("op_8412_cast_fp16")]; + tensor var_8413_to_fp16 = const()[name = tensor("op_8413_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_571_cast_fp16 = mul(x = var_8412_cast_fp16, y = var_8413_to_fp16)[name = tensor("aw_571_cast_fp16")]; + tensor var_8416_equation_0 = const()[name = tensor("op_8416_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8416_cast_fp16 = einsum(equation = var_8416_equation_0, values = (var_8258_cast_fp16, var_8175_cast_fp16))[name = tensor("op_8416_cast_fp16")]; + tensor var_8417_to_fp16 = const()[name = tensor("op_8417_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_573_cast_fp16 = mul(x = var_8416_cast_fp16, y = var_8417_to_fp16)[name = tensor("aw_573_cast_fp16")]; + tensor var_8420_equation_0 = const()[name = tensor("op_8420_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8420_cast_fp16 = einsum(equation = var_8420_equation_0, values = (var_8262_cast_fp16, var_8179_cast_fp16))[name = tensor("op_8420_cast_fp16")]; + tensor var_8421_to_fp16 = const()[name = tensor("op_8421_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_575_cast_fp16 = mul(x = var_8420_cast_fp16, y = var_8421_to_fp16)[name = tensor("aw_575_cast_fp16")]; + tensor var_8424_equation_0 = const()[name = tensor("op_8424_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8424_cast_fp16 = einsum(equation = var_8424_equation_0, values = (var_8266_cast_fp16, var_8183_cast_fp16))[name = tensor("op_8424_cast_fp16")]; + tensor var_8425_to_fp16 = const()[name = tensor("op_8425_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_577_cast_fp16 = mul(x = var_8424_cast_fp16, y = var_8425_to_fp16)[name = tensor("aw_577_cast_fp16")]; + tensor var_8428_equation_0 = const()[name = tensor("op_8428_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8428_cast_fp16 = einsum(equation = var_8428_equation_0, values = (var_8270_cast_fp16, var_8187_cast_fp16))[name = tensor("op_8428_cast_fp16")]; + tensor var_8429_to_fp16 = const()[name = tensor("op_8429_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_579_cast_fp16 = mul(x = var_8428_cast_fp16, y = var_8429_to_fp16)[name = tensor("aw_579_cast_fp16")]; + tensor var_8432_equation_0 = const()[name = tensor("op_8432_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8432_cast_fp16 = einsum(equation = var_8432_equation_0, values = (var_8274_cast_fp16, var_8191_cast_fp16))[name = tensor("op_8432_cast_fp16")]; + tensor var_8433_to_fp16 = const()[name = tensor("op_8433_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_581_cast_fp16 = mul(x = var_8432_cast_fp16, y = var_8433_to_fp16)[name = tensor("aw_581_cast_fp16")]; + tensor var_8436_equation_0 = const()[name = tensor("op_8436_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8436_cast_fp16 = einsum(equation = var_8436_equation_0, values = (var_8278_cast_fp16, var_8195_cast_fp16))[name = tensor("op_8436_cast_fp16")]; + tensor var_8437_to_fp16 = const()[name = tensor("op_8437_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_583_cast_fp16 = mul(x = var_8436_cast_fp16, y = var_8437_to_fp16)[name = tensor("aw_583_cast_fp16")]; + tensor var_8440_equation_0 = const()[name = tensor("op_8440_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8440_cast_fp16 = einsum(equation = var_8440_equation_0, values = (var_8282_cast_fp16, var_8199_cast_fp16))[name = tensor("op_8440_cast_fp16")]; + tensor var_8441_to_fp16 = const()[name = tensor("op_8441_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_585_cast_fp16 = mul(x = var_8440_cast_fp16, y = var_8441_to_fp16)[name = tensor("aw_585_cast_fp16")]; + tensor var_8444_equation_0 = const()[name = tensor("op_8444_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8444_cast_fp16 = einsum(equation = var_8444_equation_0, values = (var_8286_cast_fp16, var_8203_cast_fp16))[name = tensor("op_8444_cast_fp16")]; + tensor var_8445_to_fp16 = const()[name = tensor("op_8445_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_587_cast_fp16 = mul(x = var_8444_cast_fp16, y = var_8445_to_fp16)[name = tensor("aw_587_cast_fp16")]; + tensor var_8448_equation_0 = const()[name = tensor("op_8448_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8448_cast_fp16 = einsum(equation = var_8448_equation_0, values = (var_8290_cast_fp16, var_8207_cast_fp16))[name = tensor("op_8448_cast_fp16")]; + tensor var_8449_to_fp16 = const()[name = tensor("op_8449_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_589_cast_fp16 = mul(x = var_8448_cast_fp16, y = var_8449_to_fp16)[name = tensor("aw_589_cast_fp16")]; + tensor var_8452_equation_0 = const()[name = tensor("op_8452_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8452_cast_fp16 = einsum(equation = var_8452_equation_0, values = (var_8294_cast_fp16, var_8211_cast_fp16))[name = tensor("op_8452_cast_fp16")]; + tensor var_8453_to_fp16 = const()[name = tensor("op_8453_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_591_cast_fp16 = mul(x = var_8452_cast_fp16, y = var_8453_to_fp16)[name = tensor("aw_591_cast_fp16")]; + tensor var_8456_equation_0 = const()[name = tensor("op_8456_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8456_cast_fp16 = einsum(equation = var_8456_equation_0, values = (var_8298_cast_fp16, var_8215_cast_fp16))[name = tensor("op_8456_cast_fp16")]; + tensor var_8457_to_fp16 = const()[name = tensor("op_8457_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_593_cast_fp16 = mul(x = var_8456_cast_fp16, y = var_8457_to_fp16)[name = tensor("aw_593_cast_fp16")]; + tensor var_8460_equation_0 = const()[name = tensor("op_8460_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8460_cast_fp16 = einsum(equation = var_8460_equation_0, values = (var_8302_cast_fp16, var_8219_cast_fp16))[name = tensor("op_8460_cast_fp16")]; + tensor var_8461_to_fp16 = const()[name = tensor("op_8461_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_595_cast_fp16 = mul(x = var_8460_cast_fp16, y = var_8461_to_fp16)[name = tensor("aw_595_cast_fp16")]; + tensor var_8464_equation_0 = const()[name = tensor("op_8464_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8464_cast_fp16 = einsum(equation = var_8464_equation_0, values = (var_8306_cast_fp16, var_8223_cast_fp16))[name = tensor("op_8464_cast_fp16")]; + tensor var_8465_to_fp16 = const()[name = tensor("op_8465_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_597_cast_fp16 = mul(x = var_8464_cast_fp16, y = var_8465_to_fp16)[name = tensor("aw_597_cast_fp16")]; + tensor var_8468_equation_0 = const()[name = tensor("op_8468_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8468_cast_fp16 = einsum(equation = var_8468_equation_0, values = (var_8310_cast_fp16, var_8227_cast_fp16))[name = tensor("op_8468_cast_fp16")]; + tensor var_8469_to_fp16 = const()[name = tensor("op_8469_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_599_cast_fp16 = mul(x = var_8468_cast_fp16, y = var_8469_to_fp16)[name = tensor("aw_599_cast_fp16")]; + tensor var_8471_cast_fp16 = softmax(axis = var_5599, x = aw_561_cast_fp16)[name = tensor("op_8471_cast_fp16")]; + tensor var_8472_cast_fp16 = softmax(axis = var_5599, x = aw_563_cast_fp16)[name = tensor("op_8472_cast_fp16")]; + tensor var_8473_cast_fp16 = softmax(axis = var_5599, x = aw_565_cast_fp16)[name = tensor("op_8473_cast_fp16")]; + tensor var_8474_cast_fp16 = softmax(axis = var_5599, x = aw_567_cast_fp16)[name = tensor("op_8474_cast_fp16")]; + tensor var_8475_cast_fp16 = softmax(axis = var_5599, x = aw_569_cast_fp16)[name = tensor("op_8475_cast_fp16")]; + tensor var_8476_cast_fp16 = softmax(axis = var_5599, x = aw_571_cast_fp16)[name = tensor("op_8476_cast_fp16")]; + tensor var_8477_cast_fp16 = softmax(axis = var_5599, x = aw_573_cast_fp16)[name = tensor("op_8477_cast_fp16")]; + tensor var_8478_cast_fp16 = softmax(axis = var_5599, x = aw_575_cast_fp16)[name = tensor("op_8478_cast_fp16")]; + tensor var_8479_cast_fp16 = softmax(axis = var_5599, x = aw_577_cast_fp16)[name = tensor("op_8479_cast_fp16")]; + tensor var_8480_cast_fp16 = softmax(axis = var_5599, x = aw_579_cast_fp16)[name = tensor("op_8480_cast_fp16")]; + tensor var_8481_cast_fp16 = softmax(axis = var_5599, x = aw_581_cast_fp16)[name = tensor("op_8481_cast_fp16")]; + tensor var_8482_cast_fp16 = softmax(axis = var_5599, x = aw_583_cast_fp16)[name = tensor("op_8482_cast_fp16")]; + tensor var_8483_cast_fp16 = softmax(axis = var_5599, x = aw_585_cast_fp16)[name = tensor("op_8483_cast_fp16")]; + tensor var_8484_cast_fp16 = softmax(axis = var_5599, x = aw_587_cast_fp16)[name = tensor("op_8484_cast_fp16")]; + tensor var_8485_cast_fp16 = softmax(axis = var_5599, x = aw_589_cast_fp16)[name = tensor("op_8485_cast_fp16")]; + tensor var_8486_cast_fp16 = softmax(axis = var_5599, x = aw_591_cast_fp16)[name = tensor("op_8486_cast_fp16")]; + tensor var_8487_cast_fp16 = softmax(axis = var_5599, x = aw_593_cast_fp16)[name = tensor("op_8487_cast_fp16")]; + tensor var_8488_cast_fp16 = softmax(axis = var_5599, x = aw_595_cast_fp16)[name = tensor("op_8488_cast_fp16")]; + tensor var_8489_cast_fp16 = softmax(axis = var_5599, x = aw_597_cast_fp16)[name = tensor("op_8489_cast_fp16")]; + tensor var_8490_cast_fp16 = softmax(axis = var_5599, x = aw_599_cast_fp16)[name = tensor("op_8490_cast_fp16")]; + tensor var_8492_equation_0 = const()[name = tensor("op_8492_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8492_cast_fp16 = einsum(equation = var_8492_equation_0, values = (var_8312_cast_fp16, var_8471_cast_fp16))[name = tensor("op_8492_cast_fp16")]; + tensor var_8494_equation_0 = const()[name = tensor("op_8494_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8494_cast_fp16 = einsum(equation = var_8494_equation_0, values = (var_8316_cast_fp16, var_8472_cast_fp16))[name = tensor("op_8494_cast_fp16")]; + tensor var_8496_equation_0 = const()[name = tensor("op_8496_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8496_cast_fp16 = einsum(equation = var_8496_equation_0, values = (var_8320_cast_fp16, var_8473_cast_fp16))[name = tensor("op_8496_cast_fp16")]; + tensor var_8498_equation_0 = const()[name = tensor("op_8498_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8498_cast_fp16 = einsum(equation = var_8498_equation_0, values = (var_8324_cast_fp16, var_8474_cast_fp16))[name = tensor("op_8498_cast_fp16")]; + tensor var_8500_equation_0 = const()[name = tensor("op_8500_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8500_cast_fp16 = einsum(equation = var_8500_equation_0, values = (var_8328_cast_fp16, var_8475_cast_fp16))[name = tensor("op_8500_cast_fp16")]; + tensor var_8502_equation_0 = const()[name = tensor("op_8502_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8502_cast_fp16 = einsum(equation = var_8502_equation_0, values = (var_8332_cast_fp16, var_8476_cast_fp16))[name = tensor("op_8502_cast_fp16")]; + tensor var_8504_equation_0 = const()[name = tensor("op_8504_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8504_cast_fp16 = einsum(equation = var_8504_equation_0, values = (var_8336_cast_fp16, var_8477_cast_fp16))[name = tensor("op_8504_cast_fp16")]; + tensor var_8506_equation_0 = const()[name = tensor("op_8506_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8506_cast_fp16 = einsum(equation = var_8506_equation_0, values = (var_8340_cast_fp16, var_8478_cast_fp16))[name = tensor("op_8506_cast_fp16")]; + tensor var_8508_equation_0 = const()[name = tensor("op_8508_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8508_cast_fp16 = einsum(equation = var_8508_equation_0, values = (var_8344_cast_fp16, var_8479_cast_fp16))[name = tensor("op_8508_cast_fp16")]; + tensor var_8510_equation_0 = const()[name = tensor("op_8510_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8510_cast_fp16 = einsum(equation = var_8510_equation_0, values = (var_8348_cast_fp16, var_8480_cast_fp16))[name = tensor("op_8510_cast_fp16")]; + tensor var_8512_equation_0 = const()[name = tensor("op_8512_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8512_cast_fp16 = einsum(equation = var_8512_equation_0, values = (var_8352_cast_fp16, var_8481_cast_fp16))[name = tensor("op_8512_cast_fp16")]; + tensor var_8514_equation_0 = const()[name = tensor("op_8514_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8514_cast_fp16 = einsum(equation = var_8514_equation_0, values = (var_8356_cast_fp16, var_8482_cast_fp16))[name = tensor("op_8514_cast_fp16")]; + tensor var_8516_equation_0 = const()[name = tensor("op_8516_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8516_cast_fp16 = einsum(equation = var_8516_equation_0, values = (var_8360_cast_fp16, var_8483_cast_fp16))[name = tensor("op_8516_cast_fp16")]; + tensor var_8518_equation_0 = const()[name = tensor("op_8518_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8518_cast_fp16 = einsum(equation = var_8518_equation_0, values = (var_8364_cast_fp16, var_8484_cast_fp16))[name = tensor("op_8518_cast_fp16")]; + tensor var_8520_equation_0 = const()[name = tensor("op_8520_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8520_cast_fp16 = einsum(equation = var_8520_equation_0, values = (var_8368_cast_fp16, var_8485_cast_fp16))[name = tensor("op_8520_cast_fp16")]; + tensor var_8522_equation_0 = const()[name = tensor("op_8522_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8522_cast_fp16 = einsum(equation = var_8522_equation_0, values = (var_8372_cast_fp16, var_8486_cast_fp16))[name = tensor("op_8522_cast_fp16")]; + tensor var_8524_equation_0 = const()[name = tensor("op_8524_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8524_cast_fp16 = einsum(equation = var_8524_equation_0, values = (var_8376_cast_fp16, var_8487_cast_fp16))[name = tensor("op_8524_cast_fp16")]; + tensor var_8526_equation_0 = const()[name = tensor("op_8526_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8526_cast_fp16 = einsum(equation = var_8526_equation_0, values = (var_8380_cast_fp16, var_8488_cast_fp16))[name = tensor("op_8526_cast_fp16")]; + tensor var_8528_equation_0 = const()[name = tensor("op_8528_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8528_cast_fp16 = einsum(equation = var_8528_equation_0, values = (var_8384_cast_fp16, var_8489_cast_fp16))[name = tensor("op_8528_cast_fp16")]; + tensor var_8530_equation_0 = const()[name = tensor("op_8530_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8530_cast_fp16 = einsum(equation = var_8530_equation_0, values = (var_8388_cast_fp16, var_8490_cast_fp16))[name = tensor("op_8530_cast_fp16")]; + tensor input_355_interleave_0 = const()[name = tensor("input_355_interleave_0"), val = tensor(false)]; + tensor input_355_cast_fp16 = concat(axis = var_5599, interleave = input_355_interleave_0, values = (var_8492_cast_fp16, var_8494_cast_fp16, var_8496_cast_fp16, var_8498_cast_fp16, var_8500_cast_fp16, var_8502_cast_fp16, var_8504_cast_fp16, var_8506_cast_fp16, var_8508_cast_fp16, var_8510_cast_fp16, var_8512_cast_fp16, var_8514_cast_fp16, var_8516_cast_fp16, var_8518_cast_fp16, var_8520_cast_fp16, var_8522_cast_fp16, var_8524_cast_fp16, var_8526_cast_fp16, var_8528_cast_fp16, var_8530_cast_fp16))[name = tensor("input_355_cast_fp16")]; + tensor var_8536 = const()[name = tensor("op_8536"), val = tensor([1, 1])]; + tensor var_8538 = const()[name = tensor("op_8538"), val = tensor([1, 1])]; + tensor var_8540_pad_type_0 = const()[name = tensor("op_8540_pad_type_0"), val = tensor("custom")]; + tensor var_8540_pad_0 = const()[name = tensor("op_8540_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1473054528)))]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1476331392)))]; + tensor var_8540_cast_fp16 = conv(bias = up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_8538, groups = var_5599, pad = var_8540_pad_0, pad_type = var_8540_pad_type_0, strides = var_8536, weight = up_blocks_1_attentions_2_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_355_cast_fp16)[name = tensor("op_8540_cast_fp16")]; + tensor inputs_59_cast_fp16 = add(x = var_8540_cast_fp16, y = inputs_57_cast_fp16)[name = tensor("inputs_59_cast_fp16")]; + tensor var_8544 = const()[name = tensor("op_8544"), val = tensor([1])]; + tensor channels_mean_59_cast_fp16 = reduce_mean(axes = var_8544, keep_dims = var_5594, x = inputs_59_cast_fp16)[name = tensor("channels_mean_59_cast_fp16")]; + tensor zero_mean_59_cast_fp16 = sub(x = inputs_59_cast_fp16, y = channels_mean_59_cast_fp16)[name = tensor("zero_mean_59_cast_fp16")]; + tensor zero_mean_sq_59_cast_fp16 = mul(x = zero_mean_59_cast_fp16, y = zero_mean_59_cast_fp16)[name = tensor("zero_mean_sq_59_cast_fp16")]; + tensor var_8548 = const()[name = tensor("op_8548"), val = tensor([1])]; + tensor var_8549_cast_fp16 = reduce_mean(axes = var_8548, keep_dims = var_5594, x = zero_mean_sq_59_cast_fp16)[name = tensor("op_8549_cast_fp16")]; + tensor var_8550_to_fp16 = const()[name = tensor("op_8550_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_8551_cast_fp16 = add(x = var_8549_cast_fp16, y = var_8550_to_fp16)[name = tensor("op_8551_cast_fp16")]; + tensor denom_59_epsilon_0_to_fp16 = const()[name = tensor("denom_59_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_59_cast_fp16 = rsqrt(epsilon = denom_59_epsilon_0_to_fp16, x = var_8551_cast_fp16)[name = tensor("denom_59_cast_fp16")]; + tensor out_59_cast_fp16 = mul(x = zero_mean_59_cast_fp16, y = denom_59_cast_fp16)[name = tensor("out_59_cast_fp16")]; + tensor var_8555_to_fp16 = const()[name = tensor("op_8555_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1476334016)))]; + tensor var_8556_cast_fp16 = add(x = out_59_cast_fp16, y = var_8555_to_fp16)[name = tensor("op_8556_cast_fp16")]; + tensor var_8558_to_fp16 = const()[name = tensor("op_8558_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1476336640)))]; + tensor input_357_cast_fp16 = mul(x = var_8556_cast_fp16, y = var_8558_to_fp16)[name = tensor("input_357_cast_fp16")]; + tensor var_8566 = const()[name = tensor("op_8566"), val = tensor([1, 1])]; + tensor var_8568 = const()[name = tensor("op_8568"), val = tensor([1, 1])]; + tensor var_8570_pad_type_0 = const()[name = tensor("op_8570_pad_type_0"), val = tensor("custom")]; + tensor var_8570_pad_0 = const()[name = tensor("op_8570_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1476339264)))]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1502553728)))]; + tensor var_8570_cast_fp16 = conv(bias = up_blocks_1_attentions_2_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_8568, groups = var_5599, pad = var_8570_pad_0, pad_type = var_8570_pad_type_0, strides = var_8566, weight = up_blocks_1_attentions_2_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_357_cast_fp16)[name = tensor("op_8570_cast_fp16")]; + tensor var_8571_split_sizes_0 = const()[name = tensor("op_8571_split_sizes_0"), val = tensor([5120, 5120])]; + tensor var_8571_axis_0 = const()[name = tensor("op_8571_axis_0"), val = tensor(1)]; + tensor var_8571_cast_fp16_0, tensor var_8571_cast_fp16_1 = split(axis = var_8571_axis_0, split_sizes = var_8571_split_sizes_0, x = var_8570_cast_fp16)[name = tensor("op_8571_cast_fp16")]; + tensor var_8573_mode_0 = const()[name = tensor("op_8573_mode_0"), val = tensor("EXACT")]; + tensor var_8573_cast_fp16 = gelu(mode = var_8573_mode_0, x = var_8571_cast_fp16_1)[name = tensor("op_8573_cast_fp16")]; + tensor input_359_cast_fp16 = mul(x = var_8571_cast_fp16_0, y = var_8573_cast_fp16)[name = tensor("input_359_cast_fp16")]; + tensor var_8577 = const()[name = tensor("op_8577"), val = tensor([1, 1])]; + tensor var_8579 = const()[name = tensor("op_8579"), val = tensor([1, 1])]; + tensor var_8581_pad_type_0 = const()[name = tensor("op_8581_pad_type_0"), val = tensor("custom")]; + tensor var_8581_pad_0 = const()[name = tensor("op_8581_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1502574272)))]; + tensor up_blocks_1_attentions_2_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1515681536)))]; + tensor var_8581_cast_fp16 = conv(bias = up_blocks_1_attentions_2_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_8579, groups = var_5599, pad = var_8581_pad_0, pad_type = var_8581_pad_type_0, strides = var_8577, weight = up_blocks_1_attentions_2_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_359_cast_fp16)[name = tensor("op_8581_cast_fp16")]; + tensor hidden_states_213_cast_fp16 = add(x = var_8581_cast_fp16, y = inputs_59_cast_fp16)[name = tensor("hidden_states_213_cast_fp16")]; + tensor var_8583 = const()[name = tensor("op_8583"), val = tensor([2, 1280, 12, 12])]; + tensor input_361_cast_fp16 = reshape(shape = var_8583, x = hidden_states_213_cast_fp16)[name = tensor("input_361_cast_fp16")]; + tensor var_8587 = const()[name = tensor("op_8587"), val = tensor([1, 1])]; + tensor var_8589 = const()[name = tensor("op_8589"), val = tensor([1, 1])]; + tensor hidden_states_215_pad_type_0 = const()[name = tensor("hidden_states_215_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_215_pad_0 = const()[name = tensor("hidden_states_215_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_1_attentions_2_proj_out_weight_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1515684160)))]; + tensor up_blocks_1_attentions_2_proj_out_bias_to_fp16 = const()[name = tensor("up_blocks_1_attentions_2_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1518961024)))]; + tensor hidden_states_215_cast_fp16 = conv(bias = up_blocks_1_attentions_2_proj_out_bias_to_fp16, dilations = var_8589, groups = var_5599, pad = hidden_states_215_pad_0, pad_type = hidden_states_215_pad_type_0, strides = var_8587, weight = up_blocks_1_attentions_2_proj_out_weight_to_fp16, x = input_361_cast_fp16)[name = tensor("hidden_states_215_cast_fp16")]; + tensor input_363_cast_fp16 = add(x = hidden_states_215_cast_fp16, y = hidden_states_203_cast_fp16)[name = tensor("input_363_cast_fp16")]; + tensor input_365_scale_factor_height_0 = const()[name = tensor("input_365_scale_factor_height_0"), val = tensor(0x1p+1)]; + tensor input_365_scale_factor_width_0 = const()[name = tensor("input_365_scale_factor_width_0"), val = tensor(0x1p+1)]; + tensor input_365_cast_fp16 = upsample_nearest_neighbor(scale_factor_height = input_365_scale_factor_height_0, scale_factor_width = input_365_scale_factor_width_0, x = input_363_cast_fp16)[name = tensor("input_365_cast_fp16")]; + tensor var_8598 = const()[name = tensor("op_8598"), val = tensor([1, 1])]; + tensor var_8600 = const()[name = tensor("op_8600"), val = tensor([1, 1])]; + tensor hidden_states_217_pad_type_0 = const()[name = tensor("hidden_states_217_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_217_pad_0 = const()[name = tensor("hidden_states_217_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_1_upsamplers_0_conv_weight_to_fp16 = const()[name = tensor("up_blocks_1_upsamplers_0_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1518963648)))]; + tensor up_blocks_1_upsamplers_0_conv_bias_to_fp16 = const()[name = tensor("up_blocks_1_upsamplers_0_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1548454912)))]; + tensor hidden_states_217_cast_fp16 = conv(bias = up_blocks_1_upsamplers_0_conv_bias_to_fp16, dilations = var_8600, groups = var_5599, pad = hidden_states_217_pad_0, pad_type = hidden_states_217_pad_type_0, strides = var_8598, weight = up_blocks_1_upsamplers_0_conv_weight_to_fp16, x = input_365_cast_fp16)[name = tensor("hidden_states_217_cast_fp16")]; + tensor var_8622 = const()[name = tensor("op_8622"), val = tensor(true)]; + tensor var_8627 = const()[name = tensor("op_8627"), val = tensor(1)]; + tensor input_367_interleave_0 = const()[name = tensor("input_367_interleave_0"), val = tensor(false)]; + tensor input_367_cast_fp16 = concat(axis = var_8627, interleave = input_367_interleave_0, values = (hidden_states_217_cast_fp16, input_115_cast_fp16))[name = tensor("input_367_cast_fp16")]; + tensor reshape_168_shape_0 = const()[name = tensor("reshape_168_shape_0"), val = tensor([2, 32, 60, 24, 24])]; + tensor reshape_168_cast_fp16 = reshape(shape = reshape_168_shape_0, x = input_367_cast_fp16)[name = tensor("reshape_168_cast_fp16")]; + tensor reduce_mean_126_axes_0 = const()[name = tensor("reduce_mean_126_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_126_keep_dims_0 = const()[name = tensor("reduce_mean_126_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_126_cast_fp16 = reduce_mean(axes = reduce_mean_126_axes_0, keep_dims = reduce_mean_126_keep_dims_0, x = reshape_168_cast_fp16)[name = tensor("reduce_mean_126_cast_fp16")]; + tensor sub_84_cast_fp16 = sub(x = reshape_168_cast_fp16, y = reduce_mean_126_cast_fp16)[name = tensor("sub_84_cast_fp16")]; + tensor square_42_cast_fp16 = square(x = sub_84_cast_fp16)[name = tensor("square_42_cast_fp16")]; + tensor reduce_mean_128_axes_0 = const()[name = tensor("reduce_mean_128_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_128_keep_dims_0 = const()[name = tensor("reduce_mean_128_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_128_cast_fp16 = reduce_mean(axes = reduce_mean_128_axes_0, keep_dims = reduce_mean_128_keep_dims_0, x = square_42_cast_fp16)[name = tensor("reduce_mean_128_cast_fp16")]; + tensor add_84_y_0_to_fp16 = const()[name = tensor("add_84_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_84_cast_fp16 = add(x = reduce_mean_128_cast_fp16, y = add_84_y_0_to_fp16)[name = tensor("add_84_cast_fp16")]; + tensor sqrt_42_cast_fp16 = sqrt(x = add_84_cast_fp16)[name = tensor("sqrt_42_cast_fp16")]; + tensor real_div_42_cast_fp16 = real_div(x = sub_84_cast_fp16, y = sqrt_42_cast_fp16)[name = tensor("real_div_42_cast_fp16")]; + tensor reshape_169_shape_0 = const()[name = tensor("reshape_169_shape_0"), val = tensor([2, 1920, 24, 24])]; + tensor reshape_169_cast_fp16 = reshape(shape = reshape_169_shape_0, x = real_div_42_cast_fp16)[name = tensor("reshape_169_cast_fp16")]; + tensor add_85_gamma_0_to_fp16 = const()[name = tensor("add_85_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1548457536)))]; + tensor add_85_beta_0_to_fp16 = const()[name = tensor("add_85_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1548461440)))]; + tensor add_85_epsilon_0_to_fp16 = const()[name = tensor("add_85_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_85_cast_fp16 = batch_norm(beta = add_85_beta_0_to_fp16, epsilon = add_85_epsilon_0_to_fp16, gamma = add_85_gamma_0_to_fp16, mean = add_79_mean_0_to_fp16, variance = add_79_variance_0_to_fp16, x = reshape_169_cast_fp16)[name = tensor("add_85_cast_fp16")]; + tensor input_371_cast_fp16 = silu(x = add_85_cast_fp16)[name = tensor("input_371_cast_fp16")]; + tensor var_8656 = const()[name = tensor("op_8656"), val = tensor([1, 1])]; + tensor var_8658 = const()[name = tensor("op_8658"), val = tensor([1, 1])]; + tensor hidden_states_219_pad_type_0 = const()[name = tensor("hidden_states_219_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_219_pad_0 = const()[name = tensor("hidden_states_219_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_2_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1548465344)))]; + tensor up_blocks_2_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1570583808)))]; + tensor hidden_states_219_cast_fp16 = conv(bias = up_blocks_2_resnets_0_conv1_bias_to_fp16, dilations = var_8658, groups = var_8627, pad = hidden_states_219_pad_0, pad_type = hidden_states_219_pad_type_0, strides = var_8656, weight = up_blocks_2_resnets_0_conv1_weight_to_fp16, x = input_371_cast_fp16)[name = tensor("hidden_states_219_cast_fp16")]; + tensor var_8664 = const()[name = tensor("op_8664"), val = tensor([1, 1])]; + tensor var_8666 = const()[name = tensor("op_8666"), val = tensor([1, 1])]; + tensor temb_33_pad_type_0 = const()[name = tensor("temb_33_pad_type_0"), val = tensor("custom")]; + tensor temb_33_pad_0 = const()[name = tensor("temb_33_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1570585152)))]; + tensor up_blocks_2_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1572223616)))]; + tensor temb_33_cast_fp16 = conv(bias = up_blocks_2_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_8666, groups = var_8627, pad = temb_33_pad_0, pad_type = temb_33_pad_type_0, strides = var_8664, weight = up_blocks_2_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_33_cast_fp16")]; + tensor input_375_cast_fp16 = add(x = hidden_states_219_cast_fp16, y = temb_33_cast_fp16)[name = tensor("input_375_cast_fp16")]; + tensor reshape_172_shape_0 = const()[name = tensor("reshape_172_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_172_cast_fp16 = reshape(shape = reshape_172_shape_0, x = input_375_cast_fp16)[name = tensor("reshape_172_cast_fp16")]; + tensor reduce_mean_129_axes_0 = const()[name = tensor("reduce_mean_129_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_129_keep_dims_0 = const()[name = tensor("reduce_mean_129_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_129_cast_fp16 = reduce_mean(axes = reduce_mean_129_axes_0, keep_dims = reduce_mean_129_keep_dims_0, x = reshape_172_cast_fp16)[name = tensor("reduce_mean_129_cast_fp16")]; + tensor sub_86_cast_fp16 = sub(x = reshape_172_cast_fp16, y = reduce_mean_129_cast_fp16)[name = tensor("sub_86_cast_fp16")]; + tensor square_43_cast_fp16 = square(x = sub_86_cast_fp16)[name = tensor("square_43_cast_fp16")]; + tensor reduce_mean_131_axes_0 = const()[name = tensor("reduce_mean_131_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_131_keep_dims_0 = const()[name = tensor("reduce_mean_131_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_131_cast_fp16 = reduce_mean(axes = reduce_mean_131_axes_0, keep_dims = reduce_mean_131_keep_dims_0, x = square_43_cast_fp16)[name = tensor("reduce_mean_131_cast_fp16")]; + tensor add_86_y_0_to_fp16 = const()[name = tensor("add_86_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_86_cast_fp16 = add(x = reduce_mean_131_cast_fp16, y = add_86_y_0_to_fp16)[name = tensor("add_86_cast_fp16")]; + tensor sqrt_43_cast_fp16 = sqrt(x = add_86_cast_fp16)[name = tensor("sqrt_43_cast_fp16")]; + tensor real_div_43_cast_fp16 = real_div(x = sub_86_cast_fp16, y = sqrt_43_cast_fp16)[name = tensor("real_div_43_cast_fp16")]; + tensor reshape_173_shape_0 = const()[name = tensor("reshape_173_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_173_cast_fp16 = reshape(shape = reshape_173_shape_0, x = real_div_43_cast_fp16)[name = tensor("reshape_173_cast_fp16")]; + tensor add_87_gamma_0_to_fp16 = const()[name = tensor("add_87_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1572224960)))]; + tensor add_87_beta_0_to_fp16 = const()[name = tensor("add_87_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1572226304)))]; + tensor add_87_epsilon_0_to_fp16 = const()[name = tensor("add_87_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_87_cast_fp16 = batch_norm(beta = add_87_beta_0_to_fp16, epsilon = add_87_epsilon_0_to_fp16, gamma = add_87_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_173_cast_fp16)[name = tensor("add_87_cast_fp16")]; + tensor input_379_cast_fp16 = silu(x = add_87_cast_fp16)[name = tensor("input_379_cast_fp16")]; + tensor var_8676 = const()[name = tensor("op_8676"), val = tensor([1, 1])]; + tensor var_8678 = const()[name = tensor("op_8678"), val = tensor([1, 1])]; + tensor hidden_states_221_pad_type_0 = const()[name = tensor("hidden_states_221_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_221_pad_0 = const()[name = tensor("hidden_states_221_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_2_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1572227648)))]; + tensor up_blocks_2_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1579600512)))]; + tensor hidden_states_221_cast_fp16 = conv(bias = up_blocks_2_resnets_0_conv2_bias_to_fp16, dilations = var_8678, groups = var_8627, pad = hidden_states_221_pad_0, pad_type = hidden_states_221_pad_type_0, strides = var_8676, weight = up_blocks_2_resnets_0_conv2_weight_to_fp16, x = input_379_cast_fp16)[name = tensor("hidden_states_221_cast_fp16")]; + tensor var_8683 = const()[name = tensor("op_8683"), val = tensor([1, 1])]; + tensor var_8685 = const()[name = tensor("op_8685"), val = tensor([1, 1])]; + tensor x_17_pad_type_0 = const()[name = tensor("x_17_pad_type_0"), val = tensor("custom")]; + tensor x_17_pad_0 = const()[name = tensor("x_17_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_resnets_0_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_0_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1579601856)))]; + tensor up_blocks_2_resnets_0_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_0_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1582059520)))]; + tensor x_17_cast_fp16 = conv(bias = up_blocks_2_resnets_0_conv_shortcut_bias_to_fp16, dilations = var_8685, groups = var_8627, pad = x_17_pad_0, pad_type = x_17_pad_type_0, strides = var_8683, weight = up_blocks_2_resnets_0_conv_shortcut_weight_to_fp16, x = input_367_cast_fp16)[name = tensor("x_17_cast_fp16")]; + tensor hidden_states_223_cast_fp16 = add(x = x_17_cast_fp16, y = hidden_states_221_cast_fp16)[name = tensor("hidden_states_223_cast_fp16")]; + tensor reshape_176_shape_0 = const()[name = tensor("reshape_176_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_176_cast_fp16 = reshape(shape = reshape_176_shape_0, x = hidden_states_223_cast_fp16)[name = tensor("reshape_176_cast_fp16")]; + tensor reduce_mean_132_axes_0 = const()[name = tensor("reduce_mean_132_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_132_keep_dims_0 = const()[name = tensor("reduce_mean_132_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_132_cast_fp16 = reduce_mean(axes = reduce_mean_132_axes_0, keep_dims = reduce_mean_132_keep_dims_0, x = reshape_176_cast_fp16)[name = tensor("reduce_mean_132_cast_fp16")]; + tensor sub_88_cast_fp16 = sub(x = reshape_176_cast_fp16, y = reduce_mean_132_cast_fp16)[name = tensor("sub_88_cast_fp16")]; + tensor square_44_cast_fp16 = square(x = sub_88_cast_fp16)[name = tensor("square_44_cast_fp16")]; + tensor reduce_mean_134_axes_0 = const()[name = tensor("reduce_mean_134_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_134_keep_dims_0 = const()[name = tensor("reduce_mean_134_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_134_cast_fp16 = reduce_mean(axes = reduce_mean_134_axes_0, keep_dims = reduce_mean_134_keep_dims_0, x = square_44_cast_fp16)[name = tensor("reduce_mean_134_cast_fp16")]; + tensor add_88_y_0_to_fp16 = const()[name = tensor("add_88_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_88_cast_fp16 = add(x = reduce_mean_134_cast_fp16, y = add_88_y_0_to_fp16)[name = tensor("add_88_cast_fp16")]; + tensor sqrt_44_cast_fp16 = sqrt(x = add_88_cast_fp16)[name = tensor("sqrt_44_cast_fp16")]; + tensor real_div_44_cast_fp16 = real_div(x = sub_88_cast_fp16, y = sqrt_44_cast_fp16)[name = tensor("real_div_44_cast_fp16")]; + tensor reshape_177_shape_0 = const()[name = tensor("reshape_177_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_177_cast_fp16 = reshape(shape = reshape_177_shape_0, x = real_div_44_cast_fp16)[name = tensor("reshape_177_cast_fp16")]; + tensor add_89_gamma_0_to_fp16 = const()[name = tensor("add_89_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1582060864)))]; + tensor add_89_beta_0_to_fp16 = const()[name = tensor("add_89_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1582062208)))]; + tensor add_89_epsilon_0_to_fp16 = const()[name = tensor("add_89_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_89_cast_fp16 = batch_norm(beta = add_89_beta_0_to_fp16, epsilon = add_89_epsilon_0_to_fp16, gamma = add_89_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_177_cast_fp16)[name = tensor("add_89_cast_fp16")]; + tensor var_8705 = const()[name = tensor("op_8705"), val = tensor([1, 1])]; + tensor var_8707 = const()[name = tensor("op_8707"), val = tensor([1, 1])]; + tensor hidden_states_225_pad_type_0 = const()[name = tensor("hidden_states_225_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_225_pad_0 = const()[name = tensor("hidden_states_225_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1582063552)))]; + tensor up_blocks_2_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1582882816)))]; + tensor hidden_states_225_cast_fp16 = conv(bias = up_blocks_2_attentions_0_proj_in_bias_to_fp16, dilations = var_8707, groups = var_8627, pad = hidden_states_225_pad_0, pad_type = hidden_states_225_pad_type_0, strides = var_8705, weight = up_blocks_2_attentions_0_proj_in_weight_to_fp16, x = add_89_cast_fp16)[name = tensor("hidden_states_225_cast_fp16")]; + tensor var_8712 = const()[name = tensor("op_8712"), val = tensor([2, 640, 1, 576])]; + tensor inputs_61_cast_fp16 = reshape(shape = var_8712, x = hidden_states_225_cast_fp16)[name = tensor("inputs_61_cast_fp16")]; + tensor var_8722 = const()[name = tensor("op_8722"), val = tensor([1])]; + tensor channels_mean_61_cast_fp16 = reduce_mean(axes = var_8722, keep_dims = var_8622, x = inputs_61_cast_fp16)[name = tensor("channels_mean_61_cast_fp16")]; + tensor zero_mean_61_cast_fp16 = sub(x = inputs_61_cast_fp16, y = channels_mean_61_cast_fp16)[name = tensor("zero_mean_61_cast_fp16")]; + tensor zero_mean_sq_61_cast_fp16 = mul(x = zero_mean_61_cast_fp16, y = zero_mean_61_cast_fp16)[name = tensor("zero_mean_sq_61_cast_fp16")]; + tensor var_8726 = const()[name = tensor("op_8726"), val = tensor([1])]; + tensor var_8727_cast_fp16 = reduce_mean(axes = var_8726, keep_dims = var_8622, x = zero_mean_sq_61_cast_fp16)[name = tensor("op_8727_cast_fp16")]; + tensor var_8728_to_fp16 = const()[name = tensor("op_8728_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_8729_cast_fp16 = add(x = var_8727_cast_fp16, y = var_8728_to_fp16)[name = tensor("op_8729_cast_fp16")]; + tensor denom_61_epsilon_0_to_fp16 = const()[name = tensor("denom_61_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_61_cast_fp16 = rsqrt(epsilon = denom_61_epsilon_0_to_fp16, x = var_8729_cast_fp16)[name = tensor("denom_61_cast_fp16")]; + tensor out_61_cast_fp16 = mul(x = zero_mean_61_cast_fp16, y = denom_61_cast_fp16)[name = tensor("out_61_cast_fp16")]; + tensor var_8733_to_fp16 = const()[name = tensor("op_8733_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1582884160)))]; + tensor var_8734_cast_fp16 = add(x = out_61_cast_fp16, y = var_8733_to_fp16)[name = tensor("op_8734_cast_fp16")]; + tensor var_8736_to_fp16 = const()[name = tensor("op_8736_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1582885504)))]; + tensor hidden_states_227_cast_fp16 = mul(x = var_8734_cast_fp16, y = var_8736_to_fp16)[name = tensor("hidden_states_227_cast_fp16")]; + tensor var_8743 = const()[name = tensor("op_8743"), val = tensor([1, 1])]; + tensor var_8745 = const()[name = tensor("op_8745"), val = tensor([1, 1])]; + tensor q_41_pad_type_0 = const()[name = tensor("q_41_pad_type_0"), val = tensor("custom")]; + tensor q_41_pad_0 = const()[name = tensor("q_41_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1582886848)))]; + tensor q_41_cast_fp16 = conv(dilations = var_8745, groups = var_8627, pad = q_41_pad_0, pad_type = q_41_pad_type_0, strides = var_8743, weight = up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_227_cast_fp16)[name = tensor("q_41_cast_fp16")]; + tensor var_8749 = const()[name = tensor("op_8749"), val = tensor([1, 1])]; + tensor var_8751 = const()[name = tensor("op_8751"), val = tensor([1, 1])]; + tensor k_81_pad_type_0 = const()[name = tensor("k_81_pad_type_0"), val = tensor("custom")]; + tensor k_81_pad_0 = const()[name = tensor("k_81_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1583706112)))]; + tensor k_81_cast_fp16 = conv(dilations = var_8751, groups = var_8627, pad = k_81_pad_0, pad_type = k_81_pad_type_0, strides = var_8749, weight = up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_227_cast_fp16)[name = tensor("k_81_cast_fp16")]; + tensor var_8755 = const()[name = tensor("op_8755"), val = tensor([1, 1])]; + tensor var_8757 = const()[name = tensor("op_8757"), val = tensor([1, 1])]; + tensor v_41_pad_type_0 = const()[name = tensor("v_41_pad_type_0"), val = tensor("custom")]; + tensor v_41_pad_0 = const()[name = tensor("v_41_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1584525376)))]; + tensor v_41_cast_fp16 = conv(dilations = var_8757, groups = var_8627, pad = v_41_pad_0, pad_type = v_41_pad_type_0, strides = var_8755, weight = up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_227_cast_fp16)[name = tensor("v_41_cast_fp16")]; + tensor var_8761_begin_0 = const()[name = tensor("op_8761_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_8761_end_0 = const()[name = tensor("op_8761_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_8761_end_mask_0 = const()[name = tensor("op_8761_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8761_cast_fp16 = slice_by_index(begin = var_8761_begin_0, end = var_8761_end_0, end_mask = var_8761_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8761_cast_fp16")]; + tensor var_8765_begin_0 = const()[name = tensor("op_8765_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_8765_end_0 = const()[name = tensor("op_8765_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_8765_end_mask_0 = const()[name = tensor("op_8765_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8765_cast_fp16 = slice_by_index(begin = var_8765_begin_0, end = var_8765_end_0, end_mask = var_8765_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8765_cast_fp16")]; + tensor var_8769_begin_0 = const()[name = tensor("op_8769_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_8769_end_0 = const()[name = tensor("op_8769_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_8769_end_mask_0 = const()[name = tensor("op_8769_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8769_cast_fp16 = slice_by_index(begin = var_8769_begin_0, end = var_8769_end_0, end_mask = var_8769_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8769_cast_fp16")]; + tensor var_8773_begin_0 = const()[name = tensor("op_8773_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_8773_end_0 = const()[name = tensor("op_8773_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_8773_end_mask_0 = const()[name = tensor("op_8773_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8773_cast_fp16 = slice_by_index(begin = var_8773_begin_0, end = var_8773_end_0, end_mask = var_8773_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8773_cast_fp16")]; + tensor var_8777_begin_0 = const()[name = tensor("op_8777_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_8777_end_0 = const()[name = tensor("op_8777_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_8777_end_mask_0 = const()[name = tensor("op_8777_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8777_cast_fp16 = slice_by_index(begin = var_8777_begin_0, end = var_8777_end_0, end_mask = var_8777_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8777_cast_fp16")]; + tensor var_8781_begin_0 = const()[name = tensor("op_8781_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_8781_end_0 = const()[name = tensor("op_8781_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_8781_end_mask_0 = const()[name = tensor("op_8781_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8781_cast_fp16 = slice_by_index(begin = var_8781_begin_0, end = var_8781_end_0, end_mask = var_8781_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8781_cast_fp16")]; + tensor var_8785_begin_0 = const()[name = tensor("op_8785_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_8785_end_0 = const()[name = tensor("op_8785_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_8785_end_mask_0 = const()[name = tensor("op_8785_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8785_cast_fp16 = slice_by_index(begin = var_8785_begin_0, end = var_8785_end_0, end_mask = var_8785_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8785_cast_fp16")]; + tensor var_8789_begin_0 = const()[name = tensor("op_8789_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_8789_end_0 = const()[name = tensor("op_8789_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_8789_end_mask_0 = const()[name = tensor("op_8789_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8789_cast_fp16 = slice_by_index(begin = var_8789_begin_0, end = var_8789_end_0, end_mask = var_8789_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8789_cast_fp16")]; + tensor var_8793_begin_0 = const()[name = tensor("op_8793_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_8793_end_0 = const()[name = tensor("op_8793_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_8793_end_mask_0 = const()[name = tensor("op_8793_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8793_cast_fp16 = slice_by_index(begin = var_8793_begin_0, end = var_8793_end_0, end_mask = var_8793_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8793_cast_fp16")]; + tensor var_8797_begin_0 = const()[name = tensor("op_8797_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_8797_end_0 = const()[name = tensor("op_8797_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_8797_end_mask_0 = const()[name = tensor("op_8797_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8797_cast_fp16 = slice_by_index(begin = var_8797_begin_0, end = var_8797_end_0, end_mask = var_8797_end_mask_0, x = q_41_cast_fp16)[name = tensor("op_8797_cast_fp16")]; + tensor k_83_perm_0 = const()[name = tensor("k_83_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_8804_begin_0 = const()[name = tensor("op_8804_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_8804_end_0 = const()[name = tensor("op_8804_end_0"), val = tensor([2, 576, 1, 64])]; + tensor var_8804_end_mask_0 = const()[name = tensor("op_8804_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_11 = transpose(perm = k_83_perm_0, x = k_81_cast_fp16)[name = tensor("transpose_11")]; + tensor var_8804_cast_fp16 = slice_by_index(begin = var_8804_begin_0, end = var_8804_end_0, end_mask = var_8804_end_mask_0, x = transpose_11)[name = tensor("op_8804_cast_fp16")]; + tensor var_8808_begin_0 = const()[name = tensor("op_8808_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_8808_end_0 = const()[name = tensor("op_8808_end_0"), val = tensor([2, 576, 1, 128])]; + tensor var_8808_end_mask_0 = const()[name = tensor("op_8808_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8808_cast_fp16 = slice_by_index(begin = var_8808_begin_0, end = var_8808_end_0, end_mask = var_8808_end_mask_0, x = transpose_11)[name = tensor("op_8808_cast_fp16")]; + tensor var_8812_begin_0 = const()[name = tensor("op_8812_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_8812_end_0 = const()[name = tensor("op_8812_end_0"), val = tensor([2, 576, 1, 192])]; + tensor var_8812_end_mask_0 = const()[name = tensor("op_8812_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8812_cast_fp16 = slice_by_index(begin = var_8812_begin_0, end = var_8812_end_0, end_mask = var_8812_end_mask_0, x = transpose_11)[name = tensor("op_8812_cast_fp16")]; + tensor var_8816_begin_0 = const()[name = tensor("op_8816_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_8816_end_0 = const()[name = tensor("op_8816_end_0"), val = tensor([2, 576, 1, 256])]; + tensor var_8816_end_mask_0 = const()[name = tensor("op_8816_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8816_cast_fp16 = slice_by_index(begin = var_8816_begin_0, end = var_8816_end_0, end_mask = var_8816_end_mask_0, x = transpose_11)[name = tensor("op_8816_cast_fp16")]; + tensor var_8820_begin_0 = const()[name = tensor("op_8820_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_8820_end_0 = const()[name = tensor("op_8820_end_0"), val = tensor([2, 576, 1, 320])]; + tensor var_8820_end_mask_0 = const()[name = tensor("op_8820_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8820_cast_fp16 = slice_by_index(begin = var_8820_begin_0, end = var_8820_end_0, end_mask = var_8820_end_mask_0, x = transpose_11)[name = tensor("op_8820_cast_fp16")]; + tensor var_8824_begin_0 = const()[name = tensor("op_8824_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_8824_end_0 = const()[name = tensor("op_8824_end_0"), val = tensor([2, 576, 1, 384])]; + tensor var_8824_end_mask_0 = const()[name = tensor("op_8824_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8824_cast_fp16 = slice_by_index(begin = var_8824_begin_0, end = var_8824_end_0, end_mask = var_8824_end_mask_0, x = transpose_11)[name = tensor("op_8824_cast_fp16")]; + tensor var_8828_begin_0 = const()[name = tensor("op_8828_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_8828_end_0 = const()[name = tensor("op_8828_end_0"), val = tensor([2, 576, 1, 448])]; + tensor var_8828_end_mask_0 = const()[name = tensor("op_8828_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8828_cast_fp16 = slice_by_index(begin = var_8828_begin_0, end = var_8828_end_0, end_mask = var_8828_end_mask_0, x = transpose_11)[name = tensor("op_8828_cast_fp16")]; + tensor var_8832_begin_0 = const()[name = tensor("op_8832_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_8832_end_0 = const()[name = tensor("op_8832_end_0"), val = tensor([2, 576, 1, 512])]; + tensor var_8832_end_mask_0 = const()[name = tensor("op_8832_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8832_cast_fp16 = slice_by_index(begin = var_8832_begin_0, end = var_8832_end_0, end_mask = var_8832_end_mask_0, x = transpose_11)[name = tensor("op_8832_cast_fp16")]; + tensor var_8836_begin_0 = const()[name = tensor("op_8836_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_8836_end_0 = const()[name = tensor("op_8836_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_8836_end_mask_0 = const()[name = tensor("op_8836_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8836_cast_fp16 = slice_by_index(begin = var_8836_begin_0, end = var_8836_end_0, end_mask = var_8836_end_mask_0, x = transpose_11)[name = tensor("op_8836_cast_fp16")]; + tensor var_8840_begin_0 = const()[name = tensor("op_8840_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_8840_end_0 = const()[name = tensor("op_8840_end_0"), val = tensor([2, 576, 1, 640])]; + tensor var_8840_end_mask_0 = const()[name = tensor("op_8840_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_8840_cast_fp16 = slice_by_index(begin = var_8840_begin_0, end = var_8840_end_0, end_mask = var_8840_end_mask_0, x = transpose_11)[name = tensor("op_8840_cast_fp16")]; + tensor var_8842_begin_0 = const()[name = tensor("op_8842_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_8842_end_0 = const()[name = tensor("op_8842_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_8842_end_mask_0 = const()[name = tensor("op_8842_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8842_cast_fp16 = slice_by_index(begin = var_8842_begin_0, end = var_8842_end_0, end_mask = var_8842_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8842_cast_fp16")]; + tensor var_8846_begin_0 = const()[name = tensor("op_8846_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_8846_end_0 = const()[name = tensor("op_8846_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_8846_end_mask_0 = const()[name = tensor("op_8846_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8846_cast_fp16 = slice_by_index(begin = var_8846_begin_0, end = var_8846_end_0, end_mask = var_8846_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8846_cast_fp16")]; + tensor var_8850_begin_0 = const()[name = tensor("op_8850_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_8850_end_0 = const()[name = tensor("op_8850_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_8850_end_mask_0 = const()[name = tensor("op_8850_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8850_cast_fp16 = slice_by_index(begin = var_8850_begin_0, end = var_8850_end_0, end_mask = var_8850_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8850_cast_fp16")]; + tensor var_8854_begin_0 = const()[name = tensor("op_8854_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_8854_end_0 = const()[name = tensor("op_8854_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_8854_end_mask_0 = const()[name = tensor("op_8854_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8854_cast_fp16 = slice_by_index(begin = var_8854_begin_0, end = var_8854_end_0, end_mask = var_8854_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8854_cast_fp16")]; + tensor var_8858_begin_0 = const()[name = tensor("op_8858_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_8858_end_0 = const()[name = tensor("op_8858_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_8858_end_mask_0 = const()[name = tensor("op_8858_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8858_cast_fp16 = slice_by_index(begin = var_8858_begin_0, end = var_8858_end_0, end_mask = var_8858_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8858_cast_fp16")]; + tensor var_8862_begin_0 = const()[name = tensor("op_8862_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_8862_end_0 = const()[name = tensor("op_8862_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_8862_end_mask_0 = const()[name = tensor("op_8862_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8862_cast_fp16 = slice_by_index(begin = var_8862_begin_0, end = var_8862_end_0, end_mask = var_8862_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8862_cast_fp16")]; + tensor var_8866_begin_0 = const()[name = tensor("op_8866_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_8866_end_0 = const()[name = tensor("op_8866_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_8866_end_mask_0 = const()[name = tensor("op_8866_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8866_cast_fp16 = slice_by_index(begin = var_8866_begin_0, end = var_8866_end_0, end_mask = var_8866_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8866_cast_fp16")]; + tensor var_8870_begin_0 = const()[name = tensor("op_8870_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_8870_end_0 = const()[name = tensor("op_8870_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_8870_end_mask_0 = const()[name = tensor("op_8870_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8870_cast_fp16 = slice_by_index(begin = var_8870_begin_0, end = var_8870_end_0, end_mask = var_8870_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8870_cast_fp16")]; + tensor var_8874_begin_0 = const()[name = tensor("op_8874_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_8874_end_0 = const()[name = tensor("op_8874_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_8874_end_mask_0 = const()[name = tensor("op_8874_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8874_cast_fp16 = slice_by_index(begin = var_8874_begin_0, end = var_8874_end_0, end_mask = var_8874_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8874_cast_fp16")]; + tensor var_8878_begin_0 = const()[name = tensor("op_8878_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_8878_end_0 = const()[name = tensor("op_8878_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_8878_end_mask_0 = const()[name = tensor("op_8878_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_8878_cast_fp16 = slice_by_index(begin = var_8878_begin_0, end = var_8878_end_0, end_mask = var_8878_end_mask_0, x = v_41_cast_fp16)[name = tensor("op_8878_cast_fp16")]; + tensor var_8882_equation_0 = const()[name = tensor("op_8882_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8882_cast_fp16 = einsum(equation = var_8882_equation_0, values = (var_8804_cast_fp16, var_8761_cast_fp16))[name = tensor("op_8882_cast_fp16")]; + tensor var_8883_to_fp16 = const()[name = tensor("op_8883_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_601_cast_fp16 = mul(x = var_8882_cast_fp16, y = var_8883_to_fp16)[name = tensor("aw_601_cast_fp16")]; + tensor var_8886_equation_0 = const()[name = tensor("op_8886_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8886_cast_fp16 = einsum(equation = var_8886_equation_0, values = (var_8808_cast_fp16, var_8765_cast_fp16))[name = tensor("op_8886_cast_fp16")]; + tensor var_8887_to_fp16 = const()[name = tensor("op_8887_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_603_cast_fp16 = mul(x = var_8886_cast_fp16, y = var_8887_to_fp16)[name = tensor("aw_603_cast_fp16")]; + tensor var_8890_equation_0 = const()[name = tensor("op_8890_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8890_cast_fp16 = einsum(equation = var_8890_equation_0, values = (var_8812_cast_fp16, var_8769_cast_fp16))[name = tensor("op_8890_cast_fp16")]; + tensor var_8891_to_fp16 = const()[name = tensor("op_8891_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_605_cast_fp16 = mul(x = var_8890_cast_fp16, y = var_8891_to_fp16)[name = tensor("aw_605_cast_fp16")]; + tensor var_8894_equation_0 = const()[name = tensor("op_8894_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8894_cast_fp16 = einsum(equation = var_8894_equation_0, values = (var_8816_cast_fp16, var_8773_cast_fp16))[name = tensor("op_8894_cast_fp16")]; + tensor var_8895_to_fp16 = const()[name = tensor("op_8895_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_607_cast_fp16 = mul(x = var_8894_cast_fp16, y = var_8895_to_fp16)[name = tensor("aw_607_cast_fp16")]; + tensor var_8898_equation_0 = const()[name = tensor("op_8898_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8898_cast_fp16 = einsum(equation = var_8898_equation_0, values = (var_8820_cast_fp16, var_8777_cast_fp16))[name = tensor("op_8898_cast_fp16")]; + tensor var_8899_to_fp16 = const()[name = tensor("op_8899_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_609_cast_fp16 = mul(x = var_8898_cast_fp16, y = var_8899_to_fp16)[name = tensor("aw_609_cast_fp16")]; + tensor var_8902_equation_0 = const()[name = tensor("op_8902_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8902_cast_fp16 = einsum(equation = var_8902_equation_0, values = (var_8824_cast_fp16, var_8781_cast_fp16))[name = tensor("op_8902_cast_fp16")]; + tensor var_8903_to_fp16 = const()[name = tensor("op_8903_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_611_cast_fp16 = mul(x = var_8902_cast_fp16, y = var_8903_to_fp16)[name = tensor("aw_611_cast_fp16")]; + tensor var_8906_equation_0 = const()[name = tensor("op_8906_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8906_cast_fp16 = einsum(equation = var_8906_equation_0, values = (var_8828_cast_fp16, var_8785_cast_fp16))[name = tensor("op_8906_cast_fp16")]; + tensor var_8907_to_fp16 = const()[name = tensor("op_8907_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_613_cast_fp16 = mul(x = var_8906_cast_fp16, y = var_8907_to_fp16)[name = tensor("aw_613_cast_fp16")]; + tensor var_8910_equation_0 = const()[name = tensor("op_8910_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8910_cast_fp16 = einsum(equation = var_8910_equation_0, values = (var_8832_cast_fp16, var_8789_cast_fp16))[name = tensor("op_8910_cast_fp16")]; + tensor var_8911_to_fp16 = const()[name = tensor("op_8911_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_615_cast_fp16 = mul(x = var_8910_cast_fp16, y = var_8911_to_fp16)[name = tensor("aw_615_cast_fp16")]; + tensor var_8914_equation_0 = const()[name = tensor("op_8914_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8914_cast_fp16 = einsum(equation = var_8914_equation_0, values = (var_8836_cast_fp16, var_8793_cast_fp16))[name = tensor("op_8914_cast_fp16")]; + tensor var_8915_to_fp16 = const()[name = tensor("op_8915_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_617_cast_fp16 = mul(x = var_8914_cast_fp16, y = var_8915_to_fp16)[name = tensor("aw_617_cast_fp16")]; + tensor var_8918_equation_0 = const()[name = tensor("op_8918_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_8918_cast_fp16 = einsum(equation = var_8918_equation_0, values = (var_8840_cast_fp16, var_8797_cast_fp16))[name = tensor("op_8918_cast_fp16")]; + tensor var_8919_to_fp16 = const()[name = tensor("op_8919_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_619_cast_fp16 = mul(x = var_8918_cast_fp16, y = var_8919_to_fp16)[name = tensor("aw_619_cast_fp16")]; + tensor var_8921_cast_fp16 = softmax(axis = var_8627, x = aw_601_cast_fp16)[name = tensor("op_8921_cast_fp16")]; + tensor var_8922_cast_fp16 = softmax(axis = var_8627, x = aw_603_cast_fp16)[name = tensor("op_8922_cast_fp16")]; + tensor var_8923_cast_fp16 = softmax(axis = var_8627, x = aw_605_cast_fp16)[name = tensor("op_8923_cast_fp16")]; + tensor var_8924_cast_fp16 = softmax(axis = var_8627, x = aw_607_cast_fp16)[name = tensor("op_8924_cast_fp16")]; + tensor var_8925_cast_fp16 = softmax(axis = var_8627, x = aw_609_cast_fp16)[name = tensor("op_8925_cast_fp16")]; + tensor var_8926_cast_fp16 = softmax(axis = var_8627, x = aw_611_cast_fp16)[name = tensor("op_8926_cast_fp16")]; + tensor var_8927_cast_fp16 = softmax(axis = var_8627, x = aw_613_cast_fp16)[name = tensor("op_8927_cast_fp16")]; + tensor var_8928_cast_fp16 = softmax(axis = var_8627, x = aw_615_cast_fp16)[name = tensor("op_8928_cast_fp16")]; + tensor var_8929_cast_fp16 = softmax(axis = var_8627, x = aw_617_cast_fp16)[name = tensor("op_8929_cast_fp16")]; + tensor var_8930_cast_fp16 = softmax(axis = var_8627, x = aw_619_cast_fp16)[name = tensor("op_8930_cast_fp16")]; + tensor var_8932_equation_0 = const()[name = tensor("op_8932_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8932_cast_fp16 = einsum(equation = var_8932_equation_0, values = (var_8842_cast_fp16, var_8921_cast_fp16))[name = tensor("op_8932_cast_fp16")]; + tensor var_8934_equation_0 = const()[name = tensor("op_8934_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8934_cast_fp16 = einsum(equation = var_8934_equation_0, values = (var_8846_cast_fp16, var_8922_cast_fp16))[name = tensor("op_8934_cast_fp16")]; + tensor var_8936_equation_0 = const()[name = tensor("op_8936_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8936_cast_fp16 = einsum(equation = var_8936_equation_0, values = (var_8850_cast_fp16, var_8923_cast_fp16))[name = tensor("op_8936_cast_fp16")]; + tensor var_8938_equation_0 = const()[name = tensor("op_8938_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8938_cast_fp16 = einsum(equation = var_8938_equation_0, values = (var_8854_cast_fp16, var_8924_cast_fp16))[name = tensor("op_8938_cast_fp16")]; + tensor var_8940_equation_0 = const()[name = tensor("op_8940_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8940_cast_fp16 = einsum(equation = var_8940_equation_0, values = (var_8858_cast_fp16, var_8925_cast_fp16))[name = tensor("op_8940_cast_fp16")]; + tensor var_8942_equation_0 = const()[name = tensor("op_8942_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8942_cast_fp16 = einsum(equation = var_8942_equation_0, values = (var_8862_cast_fp16, var_8926_cast_fp16))[name = tensor("op_8942_cast_fp16")]; + tensor var_8944_equation_0 = const()[name = tensor("op_8944_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8944_cast_fp16 = einsum(equation = var_8944_equation_0, values = (var_8866_cast_fp16, var_8927_cast_fp16))[name = tensor("op_8944_cast_fp16")]; + tensor var_8946_equation_0 = const()[name = tensor("op_8946_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8946_cast_fp16 = einsum(equation = var_8946_equation_0, values = (var_8870_cast_fp16, var_8928_cast_fp16))[name = tensor("op_8946_cast_fp16")]; + tensor var_8948_equation_0 = const()[name = tensor("op_8948_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8948_cast_fp16 = einsum(equation = var_8948_equation_0, values = (var_8874_cast_fp16, var_8929_cast_fp16))[name = tensor("op_8948_cast_fp16")]; + tensor var_8950_equation_0 = const()[name = tensor("op_8950_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_8950_cast_fp16 = einsum(equation = var_8950_equation_0, values = (var_8878_cast_fp16, var_8930_cast_fp16))[name = tensor("op_8950_cast_fp16")]; + tensor input_383_interleave_0 = const()[name = tensor("input_383_interleave_0"), val = tensor(false)]; + tensor input_383_cast_fp16 = concat(axis = var_8627, interleave = input_383_interleave_0, values = (var_8932_cast_fp16, var_8934_cast_fp16, var_8936_cast_fp16, var_8938_cast_fp16, var_8940_cast_fp16, var_8942_cast_fp16, var_8944_cast_fp16, var_8946_cast_fp16, var_8948_cast_fp16, var_8950_cast_fp16))[name = tensor("input_383_cast_fp16")]; + tensor var_8956 = const()[name = tensor("op_8956"), val = tensor([1, 1])]; + tensor var_8958 = const()[name = tensor("op_8958"), val = tensor([1, 1])]; + tensor var_8960_pad_type_0 = const()[name = tensor("op_8960_pad_type_0"), val = tensor("custom")]; + tensor var_8960_pad_0 = const()[name = tensor("op_8960_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1585344640)))]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1586163904)))]; + tensor var_8960_cast_fp16 = conv(bias = up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_8958, groups = var_8627, pad = var_8960_pad_0, pad_type = var_8960_pad_type_0, strides = var_8956, weight = up_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_383_cast_fp16)[name = tensor("op_8960_cast_fp16")]; + tensor inputs_63_cast_fp16 = add(x = var_8960_cast_fp16, y = inputs_61_cast_fp16)[name = tensor("inputs_63_cast_fp16")]; + tensor var_8964 = const()[name = tensor("op_8964"), val = tensor([1])]; + tensor channels_mean_63_cast_fp16 = reduce_mean(axes = var_8964, keep_dims = var_8622, x = inputs_63_cast_fp16)[name = tensor("channels_mean_63_cast_fp16")]; + tensor zero_mean_63_cast_fp16 = sub(x = inputs_63_cast_fp16, y = channels_mean_63_cast_fp16)[name = tensor("zero_mean_63_cast_fp16")]; + tensor zero_mean_sq_63_cast_fp16 = mul(x = zero_mean_63_cast_fp16, y = zero_mean_63_cast_fp16)[name = tensor("zero_mean_sq_63_cast_fp16")]; + tensor var_8968 = const()[name = tensor("op_8968"), val = tensor([1])]; + tensor var_8969_cast_fp16 = reduce_mean(axes = var_8968, keep_dims = var_8622, x = zero_mean_sq_63_cast_fp16)[name = tensor("op_8969_cast_fp16")]; + tensor var_8970_to_fp16 = const()[name = tensor("op_8970_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_8971_cast_fp16 = add(x = var_8969_cast_fp16, y = var_8970_to_fp16)[name = tensor("op_8971_cast_fp16")]; + tensor denom_63_epsilon_0_to_fp16 = const()[name = tensor("denom_63_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_63_cast_fp16 = rsqrt(epsilon = denom_63_epsilon_0_to_fp16, x = var_8971_cast_fp16)[name = tensor("denom_63_cast_fp16")]; + tensor out_63_cast_fp16 = mul(x = zero_mean_63_cast_fp16, y = denom_63_cast_fp16)[name = tensor("out_63_cast_fp16")]; + tensor var_8975_to_fp16 = const()[name = tensor("op_8975_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1586165248)))]; + tensor var_8976_cast_fp16 = add(x = out_63_cast_fp16, y = var_8975_to_fp16)[name = tensor("op_8976_cast_fp16")]; + tensor var_8978_to_fp16 = const()[name = tensor("op_8978_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1586166592)))]; + tensor hidden_states_229_cast_fp16 = mul(x = var_8976_cast_fp16, y = var_8978_to_fp16)[name = tensor("hidden_states_229_cast_fp16")]; + tensor var_8985 = const()[name = tensor("op_8985"), val = tensor([1, 1])]; + tensor var_8987 = const()[name = tensor("op_8987"), val = tensor([1, 1])]; + tensor q_43_pad_type_0 = const()[name = tensor("q_43_pad_type_0"), val = tensor("custom")]; + tensor q_43_pad_0 = const()[name = tensor("q_43_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1586167936)))]; + tensor q_43_cast_fp16 = conv(dilations = var_8987, groups = var_8627, pad = q_43_pad_0, pad_type = q_43_pad_type_0, strides = var_8985, weight = up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_229_cast_fp16)[name = tensor("q_43_cast_fp16")]; + tensor var_8991 = const()[name = tensor("op_8991"), val = tensor([1, 1])]; + tensor var_8993 = const()[name = tensor("op_8993"), val = tensor([1, 1])]; + tensor k_85_pad_type_0 = const()[name = tensor("k_85_pad_type_0"), val = tensor("custom")]; + tensor k_85_pad_0 = const()[name = tensor("k_85_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1586987200)))]; + tensor k_85_cast_fp16 = conv(dilations = var_8993, groups = var_8627, pad = k_85_pad_0, pad_type = k_85_pad_type_0, strides = var_8991, weight = up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_85_cast_fp16")]; + tensor var_8997 = const()[name = tensor("op_8997"), val = tensor([1, 1])]; + tensor var_8999 = const()[name = tensor("op_8999"), val = tensor([1, 1])]; + tensor v_43_pad_type_0 = const()[name = tensor("v_43_pad_type_0"), val = tensor("custom")]; + tensor v_43_pad_0 = const()[name = tensor("v_43_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1588297984)))]; + tensor v_43_cast_fp16 = conv(dilations = var_8999, groups = var_8627, pad = v_43_pad_0, pad_type = v_43_pad_type_0, strides = var_8997, weight = up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_43_cast_fp16")]; + tensor var_9003_begin_0 = const()[name = tensor("op_9003_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9003_end_0 = const()[name = tensor("op_9003_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_9003_end_mask_0 = const()[name = tensor("op_9003_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9003_cast_fp16 = slice_by_index(begin = var_9003_begin_0, end = var_9003_end_0, end_mask = var_9003_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9003_cast_fp16")]; + tensor var_9007_begin_0 = const()[name = tensor("op_9007_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_9007_end_0 = const()[name = tensor("op_9007_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_9007_end_mask_0 = const()[name = tensor("op_9007_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9007_cast_fp16 = slice_by_index(begin = var_9007_begin_0, end = var_9007_end_0, end_mask = var_9007_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9007_cast_fp16")]; + tensor var_9011_begin_0 = const()[name = tensor("op_9011_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_9011_end_0 = const()[name = tensor("op_9011_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_9011_end_mask_0 = const()[name = tensor("op_9011_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9011_cast_fp16 = slice_by_index(begin = var_9011_begin_0, end = var_9011_end_0, end_mask = var_9011_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9011_cast_fp16")]; + tensor var_9015_begin_0 = const()[name = tensor("op_9015_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_9015_end_0 = const()[name = tensor("op_9015_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_9015_end_mask_0 = const()[name = tensor("op_9015_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9015_cast_fp16 = slice_by_index(begin = var_9015_begin_0, end = var_9015_end_0, end_mask = var_9015_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9015_cast_fp16")]; + tensor var_9019_begin_0 = const()[name = tensor("op_9019_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_9019_end_0 = const()[name = tensor("op_9019_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_9019_end_mask_0 = const()[name = tensor("op_9019_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9019_cast_fp16 = slice_by_index(begin = var_9019_begin_0, end = var_9019_end_0, end_mask = var_9019_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9019_cast_fp16")]; + tensor var_9023_begin_0 = const()[name = tensor("op_9023_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_9023_end_0 = const()[name = tensor("op_9023_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_9023_end_mask_0 = const()[name = tensor("op_9023_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9023_cast_fp16 = slice_by_index(begin = var_9023_begin_0, end = var_9023_end_0, end_mask = var_9023_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9023_cast_fp16")]; + tensor var_9027_begin_0 = const()[name = tensor("op_9027_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_9027_end_0 = const()[name = tensor("op_9027_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_9027_end_mask_0 = const()[name = tensor("op_9027_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9027_cast_fp16 = slice_by_index(begin = var_9027_begin_0, end = var_9027_end_0, end_mask = var_9027_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9027_cast_fp16")]; + tensor var_9031_begin_0 = const()[name = tensor("op_9031_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_9031_end_0 = const()[name = tensor("op_9031_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_9031_end_mask_0 = const()[name = tensor("op_9031_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9031_cast_fp16 = slice_by_index(begin = var_9031_begin_0, end = var_9031_end_0, end_mask = var_9031_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9031_cast_fp16")]; + tensor var_9035_begin_0 = const()[name = tensor("op_9035_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_9035_end_0 = const()[name = tensor("op_9035_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_9035_end_mask_0 = const()[name = tensor("op_9035_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9035_cast_fp16 = slice_by_index(begin = var_9035_begin_0, end = var_9035_end_0, end_mask = var_9035_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9035_cast_fp16")]; + tensor var_9039_begin_0 = const()[name = tensor("op_9039_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_9039_end_0 = const()[name = tensor("op_9039_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_9039_end_mask_0 = const()[name = tensor("op_9039_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9039_cast_fp16 = slice_by_index(begin = var_9039_begin_0, end = var_9039_end_0, end_mask = var_9039_end_mask_0, x = q_43_cast_fp16)[name = tensor("op_9039_cast_fp16")]; + tensor k_87_perm_0 = const()[name = tensor("k_87_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_9046_begin_0 = const()[name = tensor("op_9046_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9046_end_0 = const()[name = tensor("op_9046_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_9046_end_mask_0 = const()[name = tensor("op_9046_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_10 = transpose(perm = k_87_perm_0, x = k_85_cast_fp16)[name = tensor("transpose_10")]; + tensor var_9046_cast_fp16 = slice_by_index(begin = var_9046_begin_0, end = var_9046_end_0, end_mask = var_9046_end_mask_0, x = transpose_10)[name = tensor("op_9046_cast_fp16")]; + tensor var_9050_begin_0 = const()[name = tensor("op_9050_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_9050_end_0 = const()[name = tensor("op_9050_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_9050_end_mask_0 = const()[name = tensor("op_9050_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9050_cast_fp16 = slice_by_index(begin = var_9050_begin_0, end = var_9050_end_0, end_mask = var_9050_end_mask_0, x = transpose_10)[name = tensor("op_9050_cast_fp16")]; + tensor var_9054_begin_0 = const()[name = tensor("op_9054_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_9054_end_0 = const()[name = tensor("op_9054_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_9054_end_mask_0 = const()[name = tensor("op_9054_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9054_cast_fp16 = slice_by_index(begin = var_9054_begin_0, end = var_9054_end_0, end_mask = var_9054_end_mask_0, x = transpose_10)[name = tensor("op_9054_cast_fp16")]; + tensor var_9058_begin_0 = const()[name = tensor("op_9058_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_9058_end_0 = const()[name = tensor("op_9058_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_9058_end_mask_0 = const()[name = tensor("op_9058_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9058_cast_fp16 = slice_by_index(begin = var_9058_begin_0, end = var_9058_end_0, end_mask = var_9058_end_mask_0, x = transpose_10)[name = tensor("op_9058_cast_fp16")]; + tensor var_9062_begin_0 = const()[name = tensor("op_9062_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_9062_end_0 = const()[name = tensor("op_9062_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_9062_end_mask_0 = const()[name = tensor("op_9062_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9062_cast_fp16 = slice_by_index(begin = var_9062_begin_0, end = var_9062_end_0, end_mask = var_9062_end_mask_0, x = transpose_10)[name = tensor("op_9062_cast_fp16")]; + tensor var_9066_begin_0 = const()[name = tensor("op_9066_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_9066_end_0 = const()[name = tensor("op_9066_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_9066_end_mask_0 = const()[name = tensor("op_9066_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9066_cast_fp16 = slice_by_index(begin = var_9066_begin_0, end = var_9066_end_0, end_mask = var_9066_end_mask_0, x = transpose_10)[name = tensor("op_9066_cast_fp16")]; + tensor var_9070_begin_0 = const()[name = tensor("op_9070_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_9070_end_0 = const()[name = tensor("op_9070_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_9070_end_mask_0 = const()[name = tensor("op_9070_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9070_cast_fp16 = slice_by_index(begin = var_9070_begin_0, end = var_9070_end_0, end_mask = var_9070_end_mask_0, x = transpose_10)[name = tensor("op_9070_cast_fp16")]; + tensor var_9074_begin_0 = const()[name = tensor("op_9074_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_9074_end_0 = const()[name = tensor("op_9074_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_9074_end_mask_0 = const()[name = tensor("op_9074_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9074_cast_fp16 = slice_by_index(begin = var_9074_begin_0, end = var_9074_end_0, end_mask = var_9074_end_mask_0, x = transpose_10)[name = tensor("op_9074_cast_fp16")]; + tensor var_9078_begin_0 = const()[name = tensor("op_9078_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_9078_end_0 = const()[name = tensor("op_9078_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_9078_end_mask_0 = const()[name = tensor("op_9078_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9078_cast_fp16 = slice_by_index(begin = var_9078_begin_0, end = var_9078_end_0, end_mask = var_9078_end_mask_0, x = transpose_10)[name = tensor("op_9078_cast_fp16")]; + tensor var_9082_begin_0 = const()[name = tensor("op_9082_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_9082_end_0 = const()[name = tensor("op_9082_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_9082_end_mask_0 = const()[name = tensor("op_9082_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9082_cast_fp16 = slice_by_index(begin = var_9082_begin_0, end = var_9082_end_0, end_mask = var_9082_end_mask_0, x = transpose_10)[name = tensor("op_9082_cast_fp16")]; + tensor var_9084_begin_0 = const()[name = tensor("op_9084_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9084_end_0 = const()[name = tensor("op_9084_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_9084_end_mask_0 = const()[name = tensor("op_9084_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9084_cast_fp16 = slice_by_index(begin = var_9084_begin_0, end = var_9084_end_0, end_mask = var_9084_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9084_cast_fp16")]; + tensor var_9088_begin_0 = const()[name = tensor("op_9088_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_9088_end_0 = const()[name = tensor("op_9088_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_9088_end_mask_0 = const()[name = tensor("op_9088_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9088_cast_fp16 = slice_by_index(begin = var_9088_begin_0, end = var_9088_end_0, end_mask = var_9088_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9088_cast_fp16")]; + tensor var_9092_begin_0 = const()[name = tensor("op_9092_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_9092_end_0 = const()[name = tensor("op_9092_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_9092_end_mask_0 = const()[name = tensor("op_9092_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9092_cast_fp16 = slice_by_index(begin = var_9092_begin_0, end = var_9092_end_0, end_mask = var_9092_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9092_cast_fp16")]; + tensor var_9096_begin_0 = const()[name = tensor("op_9096_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_9096_end_0 = const()[name = tensor("op_9096_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_9096_end_mask_0 = const()[name = tensor("op_9096_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9096_cast_fp16 = slice_by_index(begin = var_9096_begin_0, end = var_9096_end_0, end_mask = var_9096_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9096_cast_fp16")]; + tensor var_9100_begin_0 = const()[name = tensor("op_9100_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_9100_end_0 = const()[name = tensor("op_9100_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_9100_end_mask_0 = const()[name = tensor("op_9100_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9100_cast_fp16 = slice_by_index(begin = var_9100_begin_0, end = var_9100_end_0, end_mask = var_9100_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9100_cast_fp16")]; + tensor var_9104_begin_0 = const()[name = tensor("op_9104_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_9104_end_0 = const()[name = tensor("op_9104_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_9104_end_mask_0 = const()[name = tensor("op_9104_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9104_cast_fp16 = slice_by_index(begin = var_9104_begin_0, end = var_9104_end_0, end_mask = var_9104_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9104_cast_fp16")]; + tensor var_9108_begin_0 = const()[name = tensor("op_9108_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_9108_end_0 = const()[name = tensor("op_9108_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_9108_end_mask_0 = const()[name = tensor("op_9108_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9108_cast_fp16 = slice_by_index(begin = var_9108_begin_0, end = var_9108_end_0, end_mask = var_9108_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9108_cast_fp16")]; + tensor var_9112_begin_0 = const()[name = tensor("op_9112_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_9112_end_0 = const()[name = tensor("op_9112_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_9112_end_mask_0 = const()[name = tensor("op_9112_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9112_cast_fp16 = slice_by_index(begin = var_9112_begin_0, end = var_9112_end_0, end_mask = var_9112_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9112_cast_fp16")]; + tensor var_9116_begin_0 = const()[name = tensor("op_9116_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_9116_end_0 = const()[name = tensor("op_9116_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_9116_end_mask_0 = const()[name = tensor("op_9116_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9116_cast_fp16 = slice_by_index(begin = var_9116_begin_0, end = var_9116_end_0, end_mask = var_9116_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9116_cast_fp16")]; + tensor var_9120_begin_0 = const()[name = tensor("op_9120_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_9120_end_0 = const()[name = tensor("op_9120_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_9120_end_mask_0 = const()[name = tensor("op_9120_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9120_cast_fp16 = slice_by_index(begin = var_9120_begin_0, end = var_9120_end_0, end_mask = var_9120_end_mask_0, x = v_43_cast_fp16)[name = tensor("op_9120_cast_fp16")]; + tensor var_9124_equation_0 = const()[name = tensor("op_9124_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9124_cast_fp16 = einsum(equation = var_9124_equation_0, values = (var_9046_cast_fp16, var_9003_cast_fp16))[name = tensor("op_9124_cast_fp16")]; + tensor var_9125_to_fp16 = const()[name = tensor("op_9125_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_621_cast_fp16 = mul(x = var_9124_cast_fp16, y = var_9125_to_fp16)[name = tensor("aw_621_cast_fp16")]; + tensor var_9128_equation_0 = const()[name = tensor("op_9128_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9128_cast_fp16 = einsum(equation = var_9128_equation_0, values = (var_9050_cast_fp16, var_9007_cast_fp16))[name = tensor("op_9128_cast_fp16")]; + tensor var_9129_to_fp16 = const()[name = tensor("op_9129_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_623_cast_fp16 = mul(x = var_9128_cast_fp16, y = var_9129_to_fp16)[name = tensor("aw_623_cast_fp16")]; + tensor var_9132_equation_0 = const()[name = tensor("op_9132_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9132_cast_fp16 = einsum(equation = var_9132_equation_0, values = (var_9054_cast_fp16, var_9011_cast_fp16))[name = tensor("op_9132_cast_fp16")]; + tensor var_9133_to_fp16 = const()[name = tensor("op_9133_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_625_cast_fp16 = mul(x = var_9132_cast_fp16, y = var_9133_to_fp16)[name = tensor("aw_625_cast_fp16")]; + tensor var_9136_equation_0 = const()[name = tensor("op_9136_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9136_cast_fp16 = einsum(equation = var_9136_equation_0, values = (var_9058_cast_fp16, var_9015_cast_fp16))[name = tensor("op_9136_cast_fp16")]; + tensor var_9137_to_fp16 = const()[name = tensor("op_9137_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_627_cast_fp16 = mul(x = var_9136_cast_fp16, y = var_9137_to_fp16)[name = tensor("aw_627_cast_fp16")]; + tensor var_9140_equation_0 = const()[name = tensor("op_9140_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9140_cast_fp16 = einsum(equation = var_9140_equation_0, values = (var_9062_cast_fp16, var_9019_cast_fp16))[name = tensor("op_9140_cast_fp16")]; + tensor var_9141_to_fp16 = const()[name = tensor("op_9141_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_629_cast_fp16 = mul(x = var_9140_cast_fp16, y = var_9141_to_fp16)[name = tensor("aw_629_cast_fp16")]; + tensor var_9144_equation_0 = const()[name = tensor("op_9144_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9144_cast_fp16 = einsum(equation = var_9144_equation_0, values = (var_9066_cast_fp16, var_9023_cast_fp16))[name = tensor("op_9144_cast_fp16")]; + tensor var_9145_to_fp16 = const()[name = tensor("op_9145_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_631_cast_fp16 = mul(x = var_9144_cast_fp16, y = var_9145_to_fp16)[name = tensor("aw_631_cast_fp16")]; + tensor var_9148_equation_0 = const()[name = tensor("op_9148_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9148_cast_fp16 = einsum(equation = var_9148_equation_0, values = (var_9070_cast_fp16, var_9027_cast_fp16))[name = tensor("op_9148_cast_fp16")]; + tensor var_9149_to_fp16 = const()[name = tensor("op_9149_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_633_cast_fp16 = mul(x = var_9148_cast_fp16, y = var_9149_to_fp16)[name = tensor("aw_633_cast_fp16")]; + tensor var_9152_equation_0 = const()[name = tensor("op_9152_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9152_cast_fp16 = einsum(equation = var_9152_equation_0, values = (var_9074_cast_fp16, var_9031_cast_fp16))[name = tensor("op_9152_cast_fp16")]; + tensor var_9153_to_fp16 = const()[name = tensor("op_9153_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_635_cast_fp16 = mul(x = var_9152_cast_fp16, y = var_9153_to_fp16)[name = tensor("aw_635_cast_fp16")]; + tensor var_9156_equation_0 = const()[name = tensor("op_9156_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9156_cast_fp16 = einsum(equation = var_9156_equation_0, values = (var_9078_cast_fp16, var_9035_cast_fp16))[name = tensor("op_9156_cast_fp16")]; + tensor var_9157_to_fp16 = const()[name = tensor("op_9157_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_637_cast_fp16 = mul(x = var_9156_cast_fp16, y = var_9157_to_fp16)[name = tensor("aw_637_cast_fp16")]; + tensor var_9160_equation_0 = const()[name = tensor("op_9160_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9160_cast_fp16 = einsum(equation = var_9160_equation_0, values = (var_9082_cast_fp16, var_9039_cast_fp16))[name = tensor("op_9160_cast_fp16")]; + tensor var_9161_to_fp16 = const()[name = tensor("op_9161_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_639_cast_fp16 = mul(x = var_9160_cast_fp16, y = var_9161_to_fp16)[name = tensor("aw_639_cast_fp16")]; + tensor var_9163_cast_fp16 = softmax(axis = var_8627, x = aw_621_cast_fp16)[name = tensor("op_9163_cast_fp16")]; + tensor var_9164_cast_fp16 = softmax(axis = var_8627, x = aw_623_cast_fp16)[name = tensor("op_9164_cast_fp16")]; + tensor var_9165_cast_fp16 = softmax(axis = var_8627, x = aw_625_cast_fp16)[name = tensor("op_9165_cast_fp16")]; + tensor var_9166_cast_fp16 = softmax(axis = var_8627, x = aw_627_cast_fp16)[name = tensor("op_9166_cast_fp16")]; + tensor var_9167_cast_fp16 = softmax(axis = var_8627, x = aw_629_cast_fp16)[name = tensor("op_9167_cast_fp16")]; + tensor var_9168_cast_fp16 = softmax(axis = var_8627, x = aw_631_cast_fp16)[name = tensor("op_9168_cast_fp16")]; + tensor var_9169_cast_fp16 = softmax(axis = var_8627, x = aw_633_cast_fp16)[name = tensor("op_9169_cast_fp16")]; + tensor var_9170_cast_fp16 = softmax(axis = var_8627, x = aw_635_cast_fp16)[name = tensor("op_9170_cast_fp16")]; + tensor var_9171_cast_fp16 = softmax(axis = var_8627, x = aw_637_cast_fp16)[name = tensor("op_9171_cast_fp16")]; + tensor var_9172_cast_fp16 = softmax(axis = var_8627, x = aw_639_cast_fp16)[name = tensor("op_9172_cast_fp16")]; + tensor var_9174_equation_0 = const()[name = tensor("op_9174_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9174_cast_fp16 = einsum(equation = var_9174_equation_0, values = (var_9084_cast_fp16, var_9163_cast_fp16))[name = tensor("op_9174_cast_fp16")]; + tensor var_9176_equation_0 = const()[name = tensor("op_9176_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9176_cast_fp16 = einsum(equation = var_9176_equation_0, values = (var_9088_cast_fp16, var_9164_cast_fp16))[name = tensor("op_9176_cast_fp16")]; + tensor var_9178_equation_0 = const()[name = tensor("op_9178_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9178_cast_fp16 = einsum(equation = var_9178_equation_0, values = (var_9092_cast_fp16, var_9165_cast_fp16))[name = tensor("op_9178_cast_fp16")]; + tensor var_9180_equation_0 = const()[name = tensor("op_9180_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9180_cast_fp16 = einsum(equation = var_9180_equation_0, values = (var_9096_cast_fp16, var_9166_cast_fp16))[name = tensor("op_9180_cast_fp16")]; + tensor var_9182_equation_0 = const()[name = tensor("op_9182_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9182_cast_fp16 = einsum(equation = var_9182_equation_0, values = (var_9100_cast_fp16, var_9167_cast_fp16))[name = tensor("op_9182_cast_fp16")]; + tensor var_9184_equation_0 = const()[name = tensor("op_9184_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9184_cast_fp16 = einsum(equation = var_9184_equation_0, values = (var_9104_cast_fp16, var_9168_cast_fp16))[name = tensor("op_9184_cast_fp16")]; + tensor var_9186_equation_0 = const()[name = tensor("op_9186_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9186_cast_fp16 = einsum(equation = var_9186_equation_0, values = (var_9108_cast_fp16, var_9169_cast_fp16))[name = tensor("op_9186_cast_fp16")]; + tensor var_9188_equation_0 = const()[name = tensor("op_9188_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9188_cast_fp16 = einsum(equation = var_9188_equation_0, values = (var_9112_cast_fp16, var_9170_cast_fp16))[name = tensor("op_9188_cast_fp16")]; + tensor var_9190_equation_0 = const()[name = tensor("op_9190_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9190_cast_fp16 = einsum(equation = var_9190_equation_0, values = (var_9116_cast_fp16, var_9171_cast_fp16))[name = tensor("op_9190_cast_fp16")]; + tensor var_9192_equation_0 = const()[name = tensor("op_9192_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9192_cast_fp16 = einsum(equation = var_9192_equation_0, values = (var_9120_cast_fp16, var_9172_cast_fp16))[name = tensor("op_9192_cast_fp16")]; + tensor input_385_interleave_0 = const()[name = tensor("input_385_interleave_0"), val = tensor(false)]; + tensor input_385_cast_fp16 = concat(axis = var_8627, interleave = input_385_interleave_0, values = (var_9174_cast_fp16, var_9176_cast_fp16, var_9178_cast_fp16, var_9180_cast_fp16, var_9182_cast_fp16, var_9184_cast_fp16, var_9186_cast_fp16, var_9188_cast_fp16, var_9190_cast_fp16, var_9192_cast_fp16))[name = tensor("input_385_cast_fp16")]; + tensor var_9198 = const()[name = tensor("op_9198"), val = tensor([1, 1])]; + tensor var_9200 = const()[name = tensor("op_9200"), val = tensor([1, 1])]; + tensor var_9202_pad_type_0 = const()[name = tensor("op_9202_pad_type_0"), val = tensor("custom")]; + tensor var_9202_pad_0 = const()[name = tensor("op_9202_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1589608768)))]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1590428032)))]; + tensor var_9202_cast_fp16 = conv(bias = up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_9200, groups = var_8627, pad = var_9202_pad_0, pad_type = var_9202_pad_type_0, strides = var_9198, weight = up_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_385_cast_fp16)[name = tensor("op_9202_cast_fp16")]; + tensor inputs_65_cast_fp16 = add(x = var_9202_cast_fp16, y = inputs_63_cast_fp16)[name = tensor("inputs_65_cast_fp16")]; + tensor var_9206 = const()[name = tensor("op_9206"), val = tensor([1])]; + tensor channels_mean_65_cast_fp16 = reduce_mean(axes = var_9206, keep_dims = var_8622, x = inputs_65_cast_fp16)[name = tensor("channels_mean_65_cast_fp16")]; + tensor zero_mean_65_cast_fp16 = sub(x = inputs_65_cast_fp16, y = channels_mean_65_cast_fp16)[name = tensor("zero_mean_65_cast_fp16")]; + tensor zero_mean_sq_65_cast_fp16 = mul(x = zero_mean_65_cast_fp16, y = zero_mean_65_cast_fp16)[name = tensor("zero_mean_sq_65_cast_fp16")]; + tensor var_9210 = const()[name = tensor("op_9210"), val = tensor([1])]; + tensor var_9211_cast_fp16 = reduce_mean(axes = var_9210, keep_dims = var_8622, x = zero_mean_sq_65_cast_fp16)[name = tensor("op_9211_cast_fp16")]; + tensor var_9212_to_fp16 = const()[name = tensor("op_9212_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_9213_cast_fp16 = add(x = var_9211_cast_fp16, y = var_9212_to_fp16)[name = tensor("op_9213_cast_fp16")]; + tensor denom_65_epsilon_0_to_fp16 = const()[name = tensor("denom_65_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_65_cast_fp16 = rsqrt(epsilon = denom_65_epsilon_0_to_fp16, x = var_9213_cast_fp16)[name = tensor("denom_65_cast_fp16")]; + tensor out_65_cast_fp16 = mul(x = zero_mean_65_cast_fp16, y = denom_65_cast_fp16)[name = tensor("out_65_cast_fp16")]; + tensor var_9217_to_fp16 = const()[name = tensor("op_9217_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1590429376)))]; + tensor var_9218_cast_fp16 = add(x = out_65_cast_fp16, y = var_9217_to_fp16)[name = tensor("op_9218_cast_fp16")]; + tensor var_9220_to_fp16 = const()[name = tensor("op_9220_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1590430720)))]; + tensor input_387_cast_fp16 = mul(x = var_9218_cast_fp16, y = var_9220_to_fp16)[name = tensor("input_387_cast_fp16")]; + tensor var_9228 = const()[name = tensor("op_9228"), val = tensor([1, 1])]; + tensor var_9230 = const()[name = tensor("op_9230"), val = tensor([1, 1])]; + tensor var_9232_pad_type_0 = const()[name = tensor("op_9232_pad_type_0"), val = tensor("custom")]; + tensor var_9232_pad_0 = const()[name = tensor("op_9232_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1590432064)))]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1596985728)))]; + tensor var_9232_cast_fp16 = conv(bias = up_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_9230, groups = var_8627, pad = var_9232_pad_0, pad_type = var_9232_pad_type_0, strides = var_9228, weight = up_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_387_cast_fp16)[name = tensor("op_9232_cast_fp16")]; + tensor var_9233_split_sizes_0 = const()[name = tensor("op_9233_split_sizes_0"), val = tensor([2560, 2560])]; + tensor var_9233_axis_0 = const()[name = tensor("op_9233_axis_0"), val = tensor(1)]; + tensor var_9233_cast_fp16_0, tensor var_9233_cast_fp16_1 = split(axis = var_9233_axis_0, split_sizes = var_9233_split_sizes_0, x = var_9232_cast_fp16)[name = tensor("op_9233_cast_fp16")]; + tensor var_9235_mode_0 = const()[name = tensor("op_9235_mode_0"), val = tensor("EXACT")]; + tensor var_9235_cast_fp16 = gelu(mode = var_9235_mode_0, x = var_9233_cast_fp16_1)[name = tensor("op_9235_cast_fp16")]; + tensor input_389_cast_fp16 = mul(x = var_9233_cast_fp16_0, y = var_9235_cast_fp16)[name = tensor("input_389_cast_fp16")]; + tensor var_9239 = const()[name = tensor("op_9239"), val = tensor([1, 1])]; + tensor var_9241 = const()[name = tensor("op_9241"), val = tensor([1, 1])]; + tensor var_9243_pad_type_0 = const()[name = tensor("op_9243_pad_type_0"), val = tensor("custom")]; + tensor var_9243_pad_0 = const()[name = tensor("op_9243_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1596996032)))]; + tensor up_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1600272896)))]; + tensor var_9243_cast_fp16 = conv(bias = up_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_9241, groups = var_8627, pad = var_9243_pad_0, pad_type = var_9243_pad_type_0, strides = var_9239, weight = up_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_389_cast_fp16)[name = tensor("op_9243_cast_fp16")]; + tensor hidden_states_233_cast_fp16 = add(x = var_9243_cast_fp16, y = inputs_65_cast_fp16)[name = tensor("hidden_states_233_cast_fp16")]; + tensor var_9245 = const()[name = tensor("op_9245"), val = tensor([2, 640, 24, 24])]; + tensor input_391_cast_fp16 = reshape(shape = var_9245, x = hidden_states_233_cast_fp16)[name = tensor("input_391_cast_fp16")]; + tensor var_9249 = const()[name = tensor("op_9249"), val = tensor([1, 1])]; + tensor var_9251 = const()[name = tensor("op_9251"), val = tensor([1, 1])]; + tensor hidden_states_235_pad_type_0 = const()[name = tensor("hidden_states_235_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_235_pad_0 = const()[name = tensor("hidden_states_235_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1600274240)))]; + tensor up_blocks_2_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1601093504)))]; + tensor hidden_states_235_cast_fp16 = conv(bias = up_blocks_2_attentions_0_proj_out_bias_to_fp16, dilations = var_9251, groups = var_8627, pad = hidden_states_235_pad_0, pad_type = hidden_states_235_pad_type_0, strides = var_9249, weight = up_blocks_2_attentions_0_proj_out_weight_to_fp16, x = input_391_cast_fp16)[name = tensor("hidden_states_235_cast_fp16")]; + tensor hidden_states_237_cast_fp16 = add(x = hidden_states_235_cast_fp16, y = hidden_states_223_cast_fp16)[name = tensor("hidden_states_237_cast_fp16")]; + tensor input_393_interleave_0 = const()[name = tensor("input_393_interleave_0"), val = tensor(false)]; + tensor input_393_cast_fp16 = concat(axis = var_8627, interleave = input_393_interleave_0, values = (hidden_states_237_cast_fp16, input_89_cast_fp16))[name = tensor("input_393_cast_fp16")]; + tensor reshape_180_shape_0 = const()[name = tensor("reshape_180_shape_0"), val = tensor([2, 32, 40, 24, 24])]; + tensor reshape_180_cast_fp16 = reshape(shape = reshape_180_shape_0, x = input_393_cast_fp16)[name = tensor("reshape_180_cast_fp16")]; + tensor reduce_mean_135_axes_0 = const()[name = tensor("reduce_mean_135_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_135_keep_dims_0 = const()[name = tensor("reduce_mean_135_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_135_cast_fp16 = reduce_mean(axes = reduce_mean_135_axes_0, keep_dims = reduce_mean_135_keep_dims_0, x = reshape_180_cast_fp16)[name = tensor("reduce_mean_135_cast_fp16")]; + tensor sub_90_cast_fp16 = sub(x = reshape_180_cast_fp16, y = reduce_mean_135_cast_fp16)[name = tensor("sub_90_cast_fp16")]; + tensor square_45_cast_fp16 = square(x = sub_90_cast_fp16)[name = tensor("square_45_cast_fp16")]; + tensor reduce_mean_137_axes_0 = const()[name = tensor("reduce_mean_137_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_137_keep_dims_0 = const()[name = tensor("reduce_mean_137_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_137_cast_fp16 = reduce_mean(axes = reduce_mean_137_axes_0, keep_dims = reduce_mean_137_keep_dims_0, x = square_45_cast_fp16)[name = tensor("reduce_mean_137_cast_fp16")]; + tensor add_90_y_0_to_fp16 = const()[name = tensor("add_90_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_90_cast_fp16 = add(x = reduce_mean_137_cast_fp16, y = add_90_y_0_to_fp16)[name = tensor("add_90_cast_fp16")]; + tensor sqrt_45_cast_fp16 = sqrt(x = add_90_cast_fp16)[name = tensor("sqrt_45_cast_fp16")]; + tensor real_div_45_cast_fp16 = real_div(x = sub_90_cast_fp16, y = sqrt_45_cast_fp16)[name = tensor("real_div_45_cast_fp16")]; + tensor reshape_181_shape_0 = const()[name = tensor("reshape_181_shape_0"), val = tensor([2, 1280, 24, 24])]; + tensor reshape_181_cast_fp16 = reshape(shape = reshape_181_shape_0, x = real_div_45_cast_fp16)[name = tensor("reshape_181_cast_fp16")]; + tensor add_91_gamma_0_to_fp16 = const()[name = tensor("add_91_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1601094848)))]; + tensor add_91_beta_0_to_fp16 = const()[name = tensor("add_91_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1601097472)))]; + tensor add_91_epsilon_0_to_fp16 = const()[name = tensor("add_91_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_91_cast_fp16 = batch_norm(beta = add_91_beta_0_to_fp16, epsilon = add_91_epsilon_0_to_fp16, gamma = add_91_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_181_cast_fp16)[name = tensor("add_91_cast_fp16")]; + tensor input_397_cast_fp16 = silu(x = add_91_cast_fp16)[name = tensor("input_397_cast_fp16")]; + tensor var_9269 = const()[name = tensor("op_9269"), val = tensor([1, 1])]; + tensor var_9271 = const()[name = tensor("op_9271"), val = tensor([1, 1])]; + tensor hidden_states_239_pad_type_0 = const()[name = tensor("hidden_states_239_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_239_pad_0 = const()[name = tensor("hidden_states_239_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_2_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1601100096)))]; + tensor up_blocks_2_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1615845760)))]; + tensor hidden_states_239_cast_fp16 = conv(bias = up_blocks_2_resnets_1_conv1_bias_to_fp16, dilations = var_9271, groups = var_8627, pad = hidden_states_239_pad_0, pad_type = hidden_states_239_pad_type_0, strides = var_9269, weight = up_blocks_2_resnets_1_conv1_weight_to_fp16, x = input_397_cast_fp16)[name = tensor("hidden_states_239_cast_fp16")]; + tensor var_9277 = const()[name = tensor("op_9277"), val = tensor([1, 1])]; + tensor var_9279 = const()[name = tensor("op_9279"), val = tensor([1, 1])]; + tensor temb_35_pad_type_0 = const()[name = tensor("temb_35_pad_type_0"), val = tensor("custom")]; + tensor temb_35_pad_0 = const()[name = tensor("temb_35_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1615847104)))]; + tensor up_blocks_2_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1617485568)))]; + tensor temb_35_cast_fp16 = conv(bias = up_blocks_2_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_9279, groups = var_8627, pad = temb_35_pad_0, pad_type = temb_35_pad_type_0, strides = var_9277, weight = up_blocks_2_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_35_cast_fp16")]; + tensor input_401_cast_fp16 = add(x = hidden_states_239_cast_fp16, y = temb_35_cast_fp16)[name = tensor("input_401_cast_fp16")]; + tensor reshape_184_shape_0 = const()[name = tensor("reshape_184_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_184_cast_fp16 = reshape(shape = reshape_184_shape_0, x = input_401_cast_fp16)[name = tensor("reshape_184_cast_fp16")]; + tensor reduce_mean_138_axes_0 = const()[name = tensor("reduce_mean_138_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_138_keep_dims_0 = const()[name = tensor("reduce_mean_138_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_138_cast_fp16 = reduce_mean(axes = reduce_mean_138_axes_0, keep_dims = reduce_mean_138_keep_dims_0, x = reshape_184_cast_fp16)[name = tensor("reduce_mean_138_cast_fp16")]; + tensor sub_92_cast_fp16 = sub(x = reshape_184_cast_fp16, y = reduce_mean_138_cast_fp16)[name = tensor("sub_92_cast_fp16")]; + tensor square_46_cast_fp16 = square(x = sub_92_cast_fp16)[name = tensor("square_46_cast_fp16")]; + tensor reduce_mean_140_axes_0 = const()[name = tensor("reduce_mean_140_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_140_keep_dims_0 = const()[name = tensor("reduce_mean_140_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_140_cast_fp16 = reduce_mean(axes = reduce_mean_140_axes_0, keep_dims = reduce_mean_140_keep_dims_0, x = square_46_cast_fp16)[name = tensor("reduce_mean_140_cast_fp16")]; + tensor add_92_y_0_to_fp16 = const()[name = tensor("add_92_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_92_cast_fp16 = add(x = reduce_mean_140_cast_fp16, y = add_92_y_0_to_fp16)[name = tensor("add_92_cast_fp16")]; + tensor sqrt_46_cast_fp16 = sqrt(x = add_92_cast_fp16)[name = tensor("sqrt_46_cast_fp16")]; + tensor real_div_46_cast_fp16 = real_div(x = sub_92_cast_fp16, y = sqrt_46_cast_fp16)[name = tensor("real_div_46_cast_fp16")]; + tensor reshape_185_shape_0 = const()[name = tensor("reshape_185_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_185_cast_fp16 = reshape(shape = reshape_185_shape_0, x = real_div_46_cast_fp16)[name = tensor("reshape_185_cast_fp16")]; + tensor add_93_gamma_0_to_fp16 = const()[name = tensor("add_93_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1617486912)))]; + tensor add_93_beta_0_to_fp16 = const()[name = tensor("add_93_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1617488256)))]; + tensor add_93_epsilon_0_to_fp16 = const()[name = tensor("add_93_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_93_cast_fp16 = batch_norm(beta = add_93_beta_0_to_fp16, epsilon = add_93_epsilon_0_to_fp16, gamma = add_93_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_185_cast_fp16)[name = tensor("add_93_cast_fp16")]; + tensor input_405_cast_fp16 = silu(x = add_93_cast_fp16)[name = tensor("input_405_cast_fp16")]; + tensor var_9289 = const()[name = tensor("op_9289"), val = tensor([1, 1])]; + tensor var_9291 = const()[name = tensor("op_9291"), val = tensor([1, 1])]; + tensor hidden_states_241_pad_type_0 = const()[name = tensor("hidden_states_241_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_241_pad_0 = const()[name = tensor("hidden_states_241_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_2_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1617489600)))]; + tensor up_blocks_2_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1624862464)))]; + tensor hidden_states_241_cast_fp16 = conv(bias = up_blocks_2_resnets_1_conv2_bias_to_fp16, dilations = var_9291, groups = var_8627, pad = hidden_states_241_pad_0, pad_type = hidden_states_241_pad_type_0, strides = var_9289, weight = up_blocks_2_resnets_1_conv2_weight_to_fp16, x = input_405_cast_fp16)[name = tensor("hidden_states_241_cast_fp16")]; + tensor var_9296 = const()[name = tensor("op_9296"), val = tensor([1, 1])]; + tensor var_9298 = const()[name = tensor("op_9298"), val = tensor([1, 1])]; + tensor x_19_pad_type_0 = const()[name = tensor("x_19_pad_type_0"), val = tensor("custom")]; + tensor x_19_pad_0 = const()[name = tensor("x_19_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_resnets_1_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_1_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1624863808)))]; + tensor up_blocks_2_resnets_1_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_1_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1626502272)))]; + tensor x_19_cast_fp16 = conv(bias = up_blocks_2_resnets_1_conv_shortcut_bias_to_fp16, dilations = var_9298, groups = var_8627, pad = x_19_pad_0, pad_type = x_19_pad_type_0, strides = var_9296, weight = up_blocks_2_resnets_1_conv_shortcut_weight_to_fp16, x = input_393_cast_fp16)[name = tensor("x_19_cast_fp16")]; + tensor hidden_states_243_cast_fp16 = add(x = x_19_cast_fp16, y = hidden_states_241_cast_fp16)[name = tensor("hidden_states_243_cast_fp16")]; + tensor reshape_188_shape_0 = const()[name = tensor("reshape_188_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_188_cast_fp16 = reshape(shape = reshape_188_shape_0, x = hidden_states_243_cast_fp16)[name = tensor("reshape_188_cast_fp16")]; + tensor reduce_mean_141_axes_0 = const()[name = tensor("reduce_mean_141_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_141_keep_dims_0 = const()[name = tensor("reduce_mean_141_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_141_cast_fp16 = reduce_mean(axes = reduce_mean_141_axes_0, keep_dims = reduce_mean_141_keep_dims_0, x = reshape_188_cast_fp16)[name = tensor("reduce_mean_141_cast_fp16")]; + tensor sub_94_cast_fp16 = sub(x = reshape_188_cast_fp16, y = reduce_mean_141_cast_fp16)[name = tensor("sub_94_cast_fp16")]; + tensor square_47_cast_fp16 = square(x = sub_94_cast_fp16)[name = tensor("square_47_cast_fp16")]; + tensor reduce_mean_143_axes_0 = const()[name = tensor("reduce_mean_143_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_143_keep_dims_0 = const()[name = tensor("reduce_mean_143_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_143_cast_fp16 = reduce_mean(axes = reduce_mean_143_axes_0, keep_dims = reduce_mean_143_keep_dims_0, x = square_47_cast_fp16)[name = tensor("reduce_mean_143_cast_fp16")]; + tensor add_94_y_0_to_fp16 = const()[name = tensor("add_94_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_94_cast_fp16 = add(x = reduce_mean_143_cast_fp16, y = add_94_y_0_to_fp16)[name = tensor("add_94_cast_fp16")]; + tensor sqrt_47_cast_fp16 = sqrt(x = add_94_cast_fp16)[name = tensor("sqrt_47_cast_fp16")]; + tensor real_div_47_cast_fp16 = real_div(x = sub_94_cast_fp16, y = sqrt_47_cast_fp16)[name = tensor("real_div_47_cast_fp16")]; + tensor reshape_189_shape_0 = const()[name = tensor("reshape_189_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_189_cast_fp16 = reshape(shape = reshape_189_shape_0, x = real_div_47_cast_fp16)[name = tensor("reshape_189_cast_fp16")]; + tensor add_95_gamma_0_to_fp16 = const()[name = tensor("add_95_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1626503616)))]; + tensor add_95_beta_0_to_fp16 = const()[name = tensor("add_95_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1626504960)))]; + tensor add_95_epsilon_0_to_fp16 = const()[name = tensor("add_95_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_95_cast_fp16 = batch_norm(beta = add_95_beta_0_to_fp16, epsilon = add_95_epsilon_0_to_fp16, gamma = add_95_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_189_cast_fp16)[name = tensor("add_95_cast_fp16")]; + tensor var_9318 = const()[name = tensor("op_9318"), val = tensor([1, 1])]; + tensor var_9320 = const()[name = tensor("op_9320"), val = tensor([1, 1])]; + tensor hidden_states_245_pad_type_0 = const()[name = tensor("hidden_states_245_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_245_pad_0 = const()[name = tensor("hidden_states_245_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_proj_in_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1626506304)))]; + tensor up_blocks_2_attentions_1_proj_in_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1627325568)))]; + tensor hidden_states_245_cast_fp16 = conv(bias = up_blocks_2_attentions_1_proj_in_bias_to_fp16, dilations = var_9320, groups = var_8627, pad = hidden_states_245_pad_0, pad_type = hidden_states_245_pad_type_0, strides = var_9318, weight = up_blocks_2_attentions_1_proj_in_weight_to_fp16, x = add_95_cast_fp16)[name = tensor("hidden_states_245_cast_fp16")]; + tensor var_9325 = const()[name = tensor("op_9325"), val = tensor([2, 640, 1, 576])]; + tensor inputs_67_cast_fp16 = reshape(shape = var_9325, x = hidden_states_245_cast_fp16)[name = tensor("inputs_67_cast_fp16")]; + tensor var_9335 = const()[name = tensor("op_9335"), val = tensor([1])]; + tensor channels_mean_67_cast_fp16 = reduce_mean(axes = var_9335, keep_dims = var_8622, x = inputs_67_cast_fp16)[name = tensor("channels_mean_67_cast_fp16")]; + tensor zero_mean_67_cast_fp16 = sub(x = inputs_67_cast_fp16, y = channels_mean_67_cast_fp16)[name = tensor("zero_mean_67_cast_fp16")]; + tensor zero_mean_sq_67_cast_fp16 = mul(x = zero_mean_67_cast_fp16, y = zero_mean_67_cast_fp16)[name = tensor("zero_mean_sq_67_cast_fp16")]; + tensor var_9339 = const()[name = tensor("op_9339"), val = tensor([1])]; + tensor var_9340_cast_fp16 = reduce_mean(axes = var_9339, keep_dims = var_8622, x = zero_mean_sq_67_cast_fp16)[name = tensor("op_9340_cast_fp16")]; + tensor var_9341_to_fp16 = const()[name = tensor("op_9341_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_9342_cast_fp16 = add(x = var_9340_cast_fp16, y = var_9341_to_fp16)[name = tensor("op_9342_cast_fp16")]; + tensor denom_67_epsilon_0_to_fp16 = const()[name = tensor("denom_67_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_67_cast_fp16 = rsqrt(epsilon = denom_67_epsilon_0_to_fp16, x = var_9342_cast_fp16)[name = tensor("denom_67_cast_fp16")]; + tensor out_67_cast_fp16 = mul(x = zero_mean_67_cast_fp16, y = denom_67_cast_fp16)[name = tensor("out_67_cast_fp16")]; + tensor var_9346_to_fp16 = const()[name = tensor("op_9346_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1627326912)))]; + tensor var_9347_cast_fp16 = add(x = out_67_cast_fp16, y = var_9346_to_fp16)[name = tensor("op_9347_cast_fp16")]; + tensor var_9349_to_fp16 = const()[name = tensor("op_9349_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1627328256)))]; + tensor hidden_states_247_cast_fp16 = mul(x = var_9347_cast_fp16, y = var_9349_to_fp16)[name = tensor("hidden_states_247_cast_fp16")]; + tensor var_9356 = const()[name = tensor("op_9356"), val = tensor([1, 1])]; + tensor var_9358 = const()[name = tensor("op_9358"), val = tensor([1, 1])]; + tensor q_45_pad_type_0 = const()[name = tensor("q_45_pad_type_0"), val = tensor("custom")]; + tensor q_45_pad_0 = const()[name = tensor("q_45_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1627329600)))]; + tensor q_45_cast_fp16 = conv(dilations = var_9358, groups = var_8627, pad = q_45_pad_0, pad_type = q_45_pad_type_0, strides = var_9356, weight = up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_247_cast_fp16)[name = tensor("q_45_cast_fp16")]; + tensor var_9362 = const()[name = tensor("op_9362"), val = tensor([1, 1])]; + tensor var_9364 = const()[name = tensor("op_9364"), val = tensor([1, 1])]; + tensor k_89_pad_type_0 = const()[name = tensor("k_89_pad_type_0"), val = tensor("custom")]; + tensor k_89_pad_0 = const()[name = tensor("k_89_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1628148864)))]; + tensor k_89_cast_fp16 = conv(dilations = var_9364, groups = var_8627, pad = k_89_pad_0, pad_type = k_89_pad_type_0, strides = var_9362, weight = up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_247_cast_fp16)[name = tensor("k_89_cast_fp16")]; + tensor var_9368 = const()[name = tensor("op_9368"), val = tensor([1, 1])]; + tensor var_9370 = const()[name = tensor("op_9370"), val = tensor([1, 1])]; + tensor v_45_pad_type_0 = const()[name = tensor("v_45_pad_type_0"), val = tensor("custom")]; + tensor v_45_pad_0 = const()[name = tensor("v_45_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1628968128)))]; + tensor v_45_cast_fp16 = conv(dilations = var_9370, groups = var_8627, pad = v_45_pad_0, pad_type = v_45_pad_type_0, strides = var_9368, weight = up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_247_cast_fp16)[name = tensor("v_45_cast_fp16")]; + tensor var_9374_begin_0 = const()[name = tensor("op_9374_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9374_end_0 = const()[name = tensor("op_9374_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_9374_end_mask_0 = const()[name = tensor("op_9374_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9374_cast_fp16 = slice_by_index(begin = var_9374_begin_0, end = var_9374_end_0, end_mask = var_9374_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9374_cast_fp16")]; + tensor var_9378_begin_0 = const()[name = tensor("op_9378_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_9378_end_0 = const()[name = tensor("op_9378_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_9378_end_mask_0 = const()[name = tensor("op_9378_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9378_cast_fp16 = slice_by_index(begin = var_9378_begin_0, end = var_9378_end_0, end_mask = var_9378_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9378_cast_fp16")]; + tensor var_9382_begin_0 = const()[name = tensor("op_9382_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_9382_end_0 = const()[name = tensor("op_9382_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_9382_end_mask_0 = const()[name = tensor("op_9382_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9382_cast_fp16 = slice_by_index(begin = var_9382_begin_0, end = var_9382_end_0, end_mask = var_9382_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9382_cast_fp16")]; + tensor var_9386_begin_0 = const()[name = tensor("op_9386_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_9386_end_0 = const()[name = tensor("op_9386_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_9386_end_mask_0 = const()[name = tensor("op_9386_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9386_cast_fp16 = slice_by_index(begin = var_9386_begin_0, end = var_9386_end_0, end_mask = var_9386_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9386_cast_fp16")]; + tensor var_9390_begin_0 = const()[name = tensor("op_9390_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_9390_end_0 = const()[name = tensor("op_9390_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_9390_end_mask_0 = const()[name = tensor("op_9390_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9390_cast_fp16 = slice_by_index(begin = var_9390_begin_0, end = var_9390_end_0, end_mask = var_9390_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9390_cast_fp16")]; + tensor var_9394_begin_0 = const()[name = tensor("op_9394_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_9394_end_0 = const()[name = tensor("op_9394_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_9394_end_mask_0 = const()[name = tensor("op_9394_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9394_cast_fp16 = slice_by_index(begin = var_9394_begin_0, end = var_9394_end_0, end_mask = var_9394_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9394_cast_fp16")]; + tensor var_9398_begin_0 = const()[name = tensor("op_9398_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_9398_end_0 = const()[name = tensor("op_9398_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_9398_end_mask_0 = const()[name = tensor("op_9398_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9398_cast_fp16 = slice_by_index(begin = var_9398_begin_0, end = var_9398_end_0, end_mask = var_9398_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9398_cast_fp16")]; + tensor var_9402_begin_0 = const()[name = tensor("op_9402_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_9402_end_0 = const()[name = tensor("op_9402_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_9402_end_mask_0 = const()[name = tensor("op_9402_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9402_cast_fp16 = slice_by_index(begin = var_9402_begin_0, end = var_9402_end_0, end_mask = var_9402_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9402_cast_fp16")]; + tensor var_9406_begin_0 = const()[name = tensor("op_9406_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_9406_end_0 = const()[name = tensor("op_9406_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_9406_end_mask_0 = const()[name = tensor("op_9406_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9406_cast_fp16 = slice_by_index(begin = var_9406_begin_0, end = var_9406_end_0, end_mask = var_9406_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9406_cast_fp16")]; + tensor var_9410_begin_0 = const()[name = tensor("op_9410_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_9410_end_0 = const()[name = tensor("op_9410_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_9410_end_mask_0 = const()[name = tensor("op_9410_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9410_cast_fp16 = slice_by_index(begin = var_9410_begin_0, end = var_9410_end_0, end_mask = var_9410_end_mask_0, x = q_45_cast_fp16)[name = tensor("op_9410_cast_fp16")]; + tensor k_91_perm_0 = const()[name = tensor("k_91_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_9417_begin_0 = const()[name = tensor("op_9417_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9417_end_0 = const()[name = tensor("op_9417_end_0"), val = tensor([2, 576, 1, 64])]; + tensor var_9417_end_mask_0 = const()[name = tensor("op_9417_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_9 = transpose(perm = k_91_perm_0, x = k_89_cast_fp16)[name = tensor("transpose_9")]; + tensor var_9417_cast_fp16 = slice_by_index(begin = var_9417_begin_0, end = var_9417_end_0, end_mask = var_9417_end_mask_0, x = transpose_9)[name = tensor("op_9417_cast_fp16")]; + tensor var_9421_begin_0 = const()[name = tensor("op_9421_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_9421_end_0 = const()[name = tensor("op_9421_end_0"), val = tensor([2, 576, 1, 128])]; + tensor var_9421_end_mask_0 = const()[name = tensor("op_9421_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9421_cast_fp16 = slice_by_index(begin = var_9421_begin_0, end = var_9421_end_0, end_mask = var_9421_end_mask_0, x = transpose_9)[name = tensor("op_9421_cast_fp16")]; + tensor var_9425_begin_0 = const()[name = tensor("op_9425_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_9425_end_0 = const()[name = tensor("op_9425_end_0"), val = tensor([2, 576, 1, 192])]; + tensor var_9425_end_mask_0 = const()[name = tensor("op_9425_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9425_cast_fp16 = slice_by_index(begin = var_9425_begin_0, end = var_9425_end_0, end_mask = var_9425_end_mask_0, x = transpose_9)[name = tensor("op_9425_cast_fp16")]; + tensor var_9429_begin_0 = const()[name = tensor("op_9429_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_9429_end_0 = const()[name = tensor("op_9429_end_0"), val = tensor([2, 576, 1, 256])]; + tensor var_9429_end_mask_0 = const()[name = tensor("op_9429_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9429_cast_fp16 = slice_by_index(begin = var_9429_begin_0, end = var_9429_end_0, end_mask = var_9429_end_mask_0, x = transpose_9)[name = tensor("op_9429_cast_fp16")]; + tensor var_9433_begin_0 = const()[name = tensor("op_9433_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_9433_end_0 = const()[name = tensor("op_9433_end_0"), val = tensor([2, 576, 1, 320])]; + tensor var_9433_end_mask_0 = const()[name = tensor("op_9433_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9433_cast_fp16 = slice_by_index(begin = var_9433_begin_0, end = var_9433_end_0, end_mask = var_9433_end_mask_0, x = transpose_9)[name = tensor("op_9433_cast_fp16")]; + tensor var_9437_begin_0 = const()[name = tensor("op_9437_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_9437_end_0 = const()[name = tensor("op_9437_end_0"), val = tensor([2, 576, 1, 384])]; + tensor var_9437_end_mask_0 = const()[name = tensor("op_9437_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9437_cast_fp16 = slice_by_index(begin = var_9437_begin_0, end = var_9437_end_0, end_mask = var_9437_end_mask_0, x = transpose_9)[name = tensor("op_9437_cast_fp16")]; + tensor var_9441_begin_0 = const()[name = tensor("op_9441_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_9441_end_0 = const()[name = tensor("op_9441_end_0"), val = tensor([2, 576, 1, 448])]; + tensor var_9441_end_mask_0 = const()[name = tensor("op_9441_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9441_cast_fp16 = slice_by_index(begin = var_9441_begin_0, end = var_9441_end_0, end_mask = var_9441_end_mask_0, x = transpose_9)[name = tensor("op_9441_cast_fp16")]; + tensor var_9445_begin_0 = const()[name = tensor("op_9445_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_9445_end_0 = const()[name = tensor("op_9445_end_0"), val = tensor([2, 576, 1, 512])]; + tensor var_9445_end_mask_0 = const()[name = tensor("op_9445_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9445_cast_fp16 = slice_by_index(begin = var_9445_begin_0, end = var_9445_end_0, end_mask = var_9445_end_mask_0, x = transpose_9)[name = tensor("op_9445_cast_fp16")]; + tensor var_9449_begin_0 = const()[name = tensor("op_9449_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_9449_end_0 = const()[name = tensor("op_9449_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_9449_end_mask_0 = const()[name = tensor("op_9449_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9449_cast_fp16 = slice_by_index(begin = var_9449_begin_0, end = var_9449_end_0, end_mask = var_9449_end_mask_0, x = transpose_9)[name = tensor("op_9449_cast_fp16")]; + tensor var_9453_begin_0 = const()[name = tensor("op_9453_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_9453_end_0 = const()[name = tensor("op_9453_end_0"), val = tensor([2, 576, 1, 640])]; + tensor var_9453_end_mask_0 = const()[name = tensor("op_9453_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9453_cast_fp16 = slice_by_index(begin = var_9453_begin_0, end = var_9453_end_0, end_mask = var_9453_end_mask_0, x = transpose_9)[name = tensor("op_9453_cast_fp16")]; + tensor var_9455_begin_0 = const()[name = tensor("op_9455_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9455_end_0 = const()[name = tensor("op_9455_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_9455_end_mask_0 = const()[name = tensor("op_9455_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9455_cast_fp16 = slice_by_index(begin = var_9455_begin_0, end = var_9455_end_0, end_mask = var_9455_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9455_cast_fp16")]; + tensor var_9459_begin_0 = const()[name = tensor("op_9459_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_9459_end_0 = const()[name = tensor("op_9459_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_9459_end_mask_0 = const()[name = tensor("op_9459_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9459_cast_fp16 = slice_by_index(begin = var_9459_begin_0, end = var_9459_end_0, end_mask = var_9459_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9459_cast_fp16")]; + tensor var_9463_begin_0 = const()[name = tensor("op_9463_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_9463_end_0 = const()[name = tensor("op_9463_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_9463_end_mask_0 = const()[name = tensor("op_9463_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9463_cast_fp16 = slice_by_index(begin = var_9463_begin_0, end = var_9463_end_0, end_mask = var_9463_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9463_cast_fp16")]; + tensor var_9467_begin_0 = const()[name = tensor("op_9467_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_9467_end_0 = const()[name = tensor("op_9467_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_9467_end_mask_0 = const()[name = tensor("op_9467_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9467_cast_fp16 = slice_by_index(begin = var_9467_begin_0, end = var_9467_end_0, end_mask = var_9467_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9467_cast_fp16")]; + tensor var_9471_begin_0 = const()[name = tensor("op_9471_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_9471_end_0 = const()[name = tensor("op_9471_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_9471_end_mask_0 = const()[name = tensor("op_9471_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9471_cast_fp16 = slice_by_index(begin = var_9471_begin_0, end = var_9471_end_0, end_mask = var_9471_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9471_cast_fp16")]; + tensor var_9475_begin_0 = const()[name = tensor("op_9475_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_9475_end_0 = const()[name = tensor("op_9475_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_9475_end_mask_0 = const()[name = tensor("op_9475_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9475_cast_fp16 = slice_by_index(begin = var_9475_begin_0, end = var_9475_end_0, end_mask = var_9475_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9475_cast_fp16")]; + tensor var_9479_begin_0 = const()[name = tensor("op_9479_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_9479_end_0 = const()[name = tensor("op_9479_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_9479_end_mask_0 = const()[name = tensor("op_9479_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9479_cast_fp16 = slice_by_index(begin = var_9479_begin_0, end = var_9479_end_0, end_mask = var_9479_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9479_cast_fp16")]; + tensor var_9483_begin_0 = const()[name = tensor("op_9483_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_9483_end_0 = const()[name = tensor("op_9483_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_9483_end_mask_0 = const()[name = tensor("op_9483_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9483_cast_fp16 = slice_by_index(begin = var_9483_begin_0, end = var_9483_end_0, end_mask = var_9483_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9483_cast_fp16")]; + tensor var_9487_begin_0 = const()[name = tensor("op_9487_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_9487_end_0 = const()[name = tensor("op_9487_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_9487_end_mask_0 = const()[name = tensor("op_9487_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9487_cast_fp16 = slice_by_index(begin = var_9487_begin_0, end = var_9487_end_0, end_mask = var_9487_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9487_cast_fp16")]; + tensor var_9491_begin_0 = const()[name = tensor("op_9491_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_9491_end_0 = const()[name = tensor("op_9491_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_9491_end_mask_0 = const()[name = tensor("op_9491_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9491_cast_fp16 = slice_by_index(begin = var_9491_begin_0, end = var_9491_end_0, end_mask = var_9491_end_mask_0, x = v_45_cast_fp16)[name = tensor("op_9491_cast_fp16")]; + tensor var_9495_equation_0 = const()[name = tensor("op_9495_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9495_cast_fp16 = einsum(equation = var_9495_equation_0, values = (var_9417_cast_fp16, var_9374_cast_fp16))[name = tensor("op_9495_cast_fp16")]; + tensor var_9496_to_fp16 = const()[name = tensor("op_9496_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_641_cast_fp16 = mul(x = var_9495_cast_fp16, y = var_9496_to_fp16)[name = tensor("aw_641_cast_fp16")]; + tensor var_9499_equation_0 = const()[name = tensor("op_9499_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9499_cast_fp16 = einsum(equation = var_9499_equation_0, values = (var_9421_cast_fp16, var_9378_cast_fp16))[name = tensor("op_9499_cast_fp16")]; + tensor var_9500_to_fp16 = const()[name = tensor("op_9500_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_643_cast_fp16 = mul(x = var_9499_cast_fp16, y = var_9500_to_fp16)[name = tensor("aw_643_cast_fp16")]; + tensor var_9503_equation_0 = const()[name = tensor("op_9503_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9503_cast_fp16 = einsum(equation = var_9503_equation_0, values = (var_9425_cast_fp16, var_9382_cast_fp16))[name = tensor("op_9503_cast_fp16")]; + tensor var_9504_to_fp16 = const()[name = tensor("op_9504_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_645_cast_fp16 = mul(x = var_9503_cast_fp16, y = var_9504_to_fp16)[name = tensor("aw_645_cast_fp16")]; + tensor var_9507_equation_0 = const()[name = tensor("op_9507_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9507_cast_fp16 = einsum(equation = var_9507_equation_0, values = (var_9429_cast_fp16, var_9386_cast_fp16))[name = tensor("op_9507_cast_fp16")]; + tensor var_9508_to_fp16 = const()[name = tensor("op_9508_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_647_cast_fp16 = mul(x = var_9507_cast_fp16, y = var_9508_to_fp16)[name = tensor("aw_647_cast_fp16")]; + tensor var_9511_equation_0 = const()[name = tensor("op_9511_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9511_cast_fp16 = einsum(equation = var_9511_equation_0, values = (var_9433_cast_fp16, var_9390_cast_fp16))[name = tensor("op_9511_cast_fp16")]; + tensor var_9512_to_fp16 = const()[name = tensor("op_9512_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_649_cast_fp16 = mul(x = var_9511_cast_fp16, y = var_9512_to_fp16)[name = tensor("aw_649_cast_fp16")]; + tensor var_9515_equation_0 = const()[name = tensor("op_9515_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9515_cast_fp16 = einsum(equation = var_9515_equation_0, values = (var_9437_cast_fp16, var_9394_cast_fp16))[name = tensor("op_9515_cast_fp16")]; + tensor var_9516_to_fp16 = const()[name = tensor("op_9516_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_651_cast_fp16 = mul(x = var_9515_cast_fp16, y = var_9516_to_fp16)[name = tensor("aw_651_cast_fp16")]; + tensor var_9519_equation_0 = const()[name = tensor("op_9519_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9519_cast_fp16 = einsum(equation = var_9519_equation_0, values = (var_9441_cast_fp16, var_9398_cast_fp16))[name = tensor("op_9519_cast_fp16")]; + tensor var_9520_to_fp16 = const()[name = tensor("op_9520_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_653_cast_fp16 = mul(x = var_9519_cast_fp16, y = var_9520_to_fp16)[name = tensor("aw_653_cast_fp16")]; + tensor var_9523_equation_0 = const()[name = tensor("op_9523_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9523_cast_fp16 = einsum(equation = var_9523_equation_0, values = (var_9445_cast_fp16, var_9402_cast_fp16))[name = tensor("op_9523_cast_fp16")]; + tensor var_9524_to_fp16 = const()[name = tensor("op_9524_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_655_cast_fp16 = mul(x = var_9523_cast_fp16, y = var_9524_to_fp16)[name = tensor("aw_655_cast_fp16")]; + tensor var_9527_equation_0 = const()[name = tensor("op_9527_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9527_cast_fp16 = einsum(equation = var_9527_equation_0, values = (var_9449_cast_fp16, var_9406_cast_fp16))[name = tensor("op_9527_cast_fp16")]; + tensor var_9528_to_fp16 = const()[name = tensor("op_9528_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_657_cast_fp16 = mul(x = var_9527_cast_fp16, y = var_9528_to_fp16)[name = tensor("aw_657_cast_fp16")]; + tensor var_9531_equation_0 = const()[name = tensor("op_9531_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9531_cast_fp16 = einsum(equation = var_9531_equation_0, values = (var_9453_cast_fp16, var_9410_cast_fp16))[name = tensor("op_9531_cast_fp16")]; + tensor var_9532_to_fp16 = const()[name = tensor("op_9532_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_659_cast_fp16 = mul(x = var_9531_cast_fp16, y = var_9532_to_fp16)[name = tensor("aw_659_cast_fp16")]; + tensor var_9534_cast_fp16 = softmax(axis = var_8627, x = aw_641_cast_fp16)[name = tensor("op_9534_cast_fp16")]; + tensor var_9535_cast_fp16 = softmax(axis = var_8627, x = aw_643_cast_fp16)[name = tensor("op_9535_cast_fp16")]; + tensor var_9536_cast_fp16 = softmax(axis = var_8627, x = aw_645_cast_fp16)[name = tensor("op_9536_cast_fp16")]; + tensor var_9537_cast_fp16 = softmax(axis = var_8627, x = aw_647_cast_fp16)[name = tensor("op_9537_cast_fp16")]; + tensor var_9538_cast_fp16 = softmax(axis = var_8627, x = aw_649_cast_fp16)[name = tensor("op_9538_cast_fp16")]; + tensor var_9539_cast_fp16 = softmax(axis = var_8627, x = aw_651_cast_fp16)[name = tensor("op_9539_cast_fp16")]; + tensor var_9540_cast_fp16 = softmax(axis = var_8627, x = aw_653_cast_fp16)[name = tensor("op_9540_cast_fp16")]; + tensor var_9541_cast_fp16 = softmax(axis = var_8627, x = aw_655_cast_fp16)[name = tensor("op_9541_cast_fp16")]; + tensor var_9542_cast_fp16 = softmax(axis = var_8627, x = aw_657_cast_fp16)[name = tensor("op_9542_cast_fp16")]; + tensor var_9543_cast_fp16 = softmax(axis = var_8627, x = aw_659_cast_fp16)[name = tensor("op_9543_cast_fp16")]; + tensor var_9545_equation_0 = const()[name = tensor("op_9545_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9545_cast_fp16 = einsum(equation = var_9545_equation_0, values = (var_9455_cast_fp16, var_9534_cast_fp16))[name = tensor("op_9545_cast_fp16")]; + tensor var_9547_equation_0 = const()[name = tensor("op_9547_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9547_cast_fp16 = einsum(equation = var_9547_equation_0, values = (var_9459_cast_fp16, var_9535_cast_fp16))[name = tensor("op_9547_cast_fp16")]; + tensor var_9549_equation_0 = const()[name = tensor("op_9549_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9549_cast_fp16 = einsum(equation = var_9549_equation_0, values = (var_9463_cast_fp16, var_9536_cast_fp16))[name = tensor("op_9549_cast_fp16")]; + tensor var_9551_equation_0 = const()[name = tensor("op_9551_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9551_cast_fp16 = einsum(equation = var_9551_equation_0, values = (var_9467_cast_fp16, var_9537_cast_fp16))[name = tensor("op_9551_cast_fp16")]; + tensor var_9553_equation_0 = const()[name = tensor("op_9553_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9553_cast_fp16 = einsum(equation = var_9553_equation_0, values = (var_9471_cast_fp16, var_9538_cast_fp16))[name = tensor("op_9553_cast_fp16")]; + tensor var_9555_equation_0 = const()[name = tensor("op_9555_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9555_cast_fp16 = einsum(equation = var_9555_equation_0, values = (var_9475_cast_fp16, var_9539_cast_fp16))[name = tensor("op_9555_cast_fp16")]; + tensor var_9557_equation_0 = const()[name = tensor("op_9557_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9557_cast_fp16 = einsum(equation = var_9557_equation_0, values = (var_9479_cast_fp16, var_9540_cast_fp16))[name = tensor("op_9557_cast_fp16")]; + tensor var_9559_equation_0 = const()[name = tensor("op_9559_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9559_cast_fp16 = einsum(equation = var_9559_equation_0, values = (var_9483_cast_fp16, var_9541_cast_fp16))[name = tensor("op_9559_cast_fp16")]; + tensor var_9561_equation_0 = const()[name = tensor("op_9561_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9561_cast_fp16 = einsum(equation = var_9561_equation_0, values = (var_9487_cast_fp16, var_9542_cast_fp16))[name = tensor("op_9561_cast_fp16")]; + tensor var_9563_equation_0 = const()[name = tensor("op_9563_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9563_cast_fp16 = einsum(equation = var_9563_equation_0, values = (var_9491_cast_fp16, var_9543_cast_fp16))[name = tensor("op_9563_cast_fp16")]; + tensor input_409_interleave_0 = const()[name = tensor("input_409_interleave_0"), val = tensor(false)]; + tensor input_409_cast_fp16 = concat(axis = var_8627, interleave = input_409_interleave_0, values = (var_9545_cast_fp16, var_9547_cast_fp16, var_9549_cast_fp16, var_9551_cast_fp16, var_9553_cast_fp16, var_9555_cast_fp16, var_9557_cast_fp16, var_9559_cast_fp16, var_9561_cast_fp16, var_9563_cast_fp16))[name = tensor("input_409_cast_fp16")]; + tensor var_9569 = const()[name = tensor("op_9569"), val = tensor([1, 1])]; + tensor var_9571 = const()[name = tensor("op_9571"), val = tensor([1, 1])]; + tensor var_9573_pad_type_0 = const()[name = tensor("op_9573_pad_type_0"), val = tensor("custom")]; + tensor var_9573_pad_0 = const()[name = tensor("op_9573_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1629787392)))]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1630606656)))]; + tensor var_9573_cast_fp16 = conv(bias = up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_9571, groups = var_8627, pad = var_9573_pad_0, pad_type = var_9573_pad_type_0, strides = var_9569, weight = up_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_409_cast_fp16)[name = tensor("op_9573_cast_fp16")]; + tensor inputs_69_cast_fp16 = add(x = var_9573_cast_fp16, y = inputs_67_cast_fp16)[name = tensor("inputs_69_cast_fp16")]; + tensor var_9577 = const()[name = tensor("op_9577"), val = tensor([1])]; + tensor channels_mean_69_cast_fp16 = reduce_mean(axes = var_9577, keep_dims = var_8622, x = inputs_69_cast_fp16)[name = tensor("channels_mean_69_cast_fp16")]; + tensor zero_mean_69_cast_fp16 = sub(x = inputs_69_cast_fp16, y = channels_mean_69_cast_fp16)[name = tensor("zero_mean_69_cast_fp16")]; + tensor zero_mean_sq_69_cast_fp16 = mul(x = zero_mean_69_cast_fp16, y = zero_mean_69_cast_fp16)[name = tensor("zero_mean_sq_69_cast_fp16")]; + tensor var_9581 = const()[name = tensor("op_9581"), val = tensor([1])]; + tensor var_9582_cast_fp16 = reduce_mean(axes = var_9581, keep_dims = var_8622, x = zero_mean_sq_69_cast_fp16)[name = tensor("op_9582_cast_fp16")]; + tensor var_9583_to_fp16 = const()[name = tensor("op_9583_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_9584_cast_fp16 = add(x = var_9582_cast_fp16, y = var_9583_to_fp16)[name = tensor("op_9584_cast_fp16")]; + tensor denom_69_epsilon_0_to_fp16 = const()[name = tensor("denom_69_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_69_cast_fp16 = rsqrt(epsilon = denom_69_epsilon_0_to_fp16, x = var_9584_cast_fp16)[name = tensor("denom_69_cast_fp16")]; + tensor out_69_cast_fp16 = mul(x = zero_mean_69_cast_fp16, y = denom_69_cast_fp16)[name = tensor("out_69_cast_fp16")]; + tensor var_9588_to_fp16 = const()[name = tensor("op_9588_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1630608000)))]; + tensor var_9589_cast_fp16 = add(x = out_69_cast_fp16, y = var_9588_to_fp16)[name = tensor("op_9589_cast_fp16")]; + tensor var_9591_to_fp16 = const()[name = tensor("op_9591_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1630609344)))]; + tensor hidden_states_249_cast_fp16 = mul(x = var_9589_cast_fp16, y = var_9591_to_fp16)[name = tensor("hidden_states_249_cast_fp16")]; + tensor var_9598 = const()[name = tensor("op_9598"), val = tensor([1, 1])]; + tensor var_9600 = const()[name = tensor("op_9600"), val = tensor([1, 1])]; + tensor q_47_pad_type_0 = const()[name = tensor("q_47_pad_type_0"), val = tensor("custom")]; + tensor q_47_pad_0 = const()[name = tensor("q_47_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1630610688)))]; + tensor q_47_cast_fp16 = conv(dilations = var_9600, groups = var_8627, pad = q_47_pad_0, pad_type = q_47_pad_type_0, strides = var_9598, weight = up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_249_cast_fp16)[name = tensor("q_47_cast_fp16")]; + tensor var_9604 = const()[name = tensor("op_9604"), val = tensor([1, 1])]; + tensor var_9606 = const()[name = tensor("op_9606"), val = tensor([1, 1])]; + tensor k_93_pad_type_0 = const()[name = tensor("k_93_pad_type_0"), val = tensor("custom")]; + tensor k_93_pad_0 = const()[name = tensor("k_93_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1631429952)))]; + tensor k_93_cast_fp16 = conv(dilations = var_9606, groups = var_8627, pad = k_93_pad_0, pad_type = k_93_pad_type_0, strides = var_9604, weight = up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_93_cast_fp16")]; + tensor var_9610 = const()[name = tensor("op_9610"), val = tensor([1, 1])]; + tensor var_9612 = const()[name = tensor("op_9612"), val = tensor([1, 1])]; + tensor v_47_pad_type_0 = const()[name = tensor("v_47_pad_type_0"), val = tensor("custom")]; + tensor v_47_pad_0 = const()[name = tensor("v_47_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1632740736)))]; + tensor v_47_cast_fp16 = conv(dilations = var_9612, groups = var_8627, pad = v_47_pad_0, pad_type = v_47_pad_type_0, strides = var_9610, weight = up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_47_cast_fp16")]; + tensor var_9616_begin_0 = const()[name = tensor("op_9616_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9616_end_0 = const()[name = tensor("op_9616_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_9616_end_mask_0 = const()[name = tensor("op_9616_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9616_cast_fp16 = slice_by_index(begin = var_9616_begin_0, end = var_9616_end_0, end_mask = var_9616_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9616_cast_fp16")]; + tensor var_9620_begin_0 = const()[name = tensor("op_9620_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_9620_end_0 = const()[name = tensor("op_9620_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_9620_end_mask_0 = const()[name = tensor("op_9620_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9620_cast_fp16 = slice_by_index(begin = var_9620_begin_0, end = var_9620_end_0, end_mask = var_9620_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9620_cast_fp16")]; + tensor var_9624_begin_0 = const()[name = tensor("op_9624_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_9624_end_0 = const()[name = tensor("op_9624_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_9624_end_mask_0 = const()[name = tensor("op_9624_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9624_cast_fp16 = slice_by_index(begin = var_9624_begin_0, end = var_9624_end_0, end_mask = var_9624_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9624_cast_fp16")]; + tensor var_9628_begin_0 = const()[name = tensor("op_9628_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_9628_end_0 = const()[name = tensor("op_9628_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_9628_end_mask_0 = const()[name = tensor("op_9628_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9628_cast_fp16 = slice_by_index(begin = var_9628_begin_0, end = var_9628_end_0, end_mask = var_9628_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9628_cast_fp16")]; + tensor var_9632_begin_0 = const()[name = tensor("op_9632_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_9632_end_0 = const()[name = tensor("op_9632_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_9632_end_mask_0 = const()[name = tensor("op_9632_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9632_cast_fp16 = slice_by_index(begin = var_9632_begin_0, end = var_9632_end_0, end_mask = var_9632_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9632_cast_fp16")]; + tensor var_9636_begin_0 = const()[name = tensor("op_9636_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_9636_end_0 = const()[name = tensor("op_9636_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_9636_end_mask_0 = const()[name = tensor("op_9636_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9636_cast_fp16 = slice_by_index(begin = var_9636_begin_0, end = var_9636_end_0, end_mask = var_9636_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9636_cast_fp16")]; + tensor var_9640_begin_0 = const()[name = tensor("op_9640_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_9640_end_0 = const()[name = tensor("op_9640_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_9640_end_mask_0 = const()[name = tensor("op_9640_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9640_cast_fp16 = slice_by_index(begin = var_9640_begin_0, end = var_9640_end_0, end_mask = var_9640_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9640_cast_fp16")]; + tensor var_9644_begin_0 = const()[name = tensor("op_9644_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_9644_end_0 = const()[name = tensor("op_9644_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_9644_end_mask_0 = const()[name = tensor("op_9644_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9644_cast_fp16 = slice_by_index(begin = var_9644_begin_0, end = var_9644_end_0, end_mask = var_9644_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9644_cast_fp16")]; + tensor var_9648_begin_0 = const()[name = tensor("op_9648_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_9648_end_0 = const()[name = tensor("op_9648_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_9648_end_mask_0 = const()[name = tensor("op_9648_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9648_cast_fp16 = slice_by_index(begin = var_9648_begin_0, end = var_9648_end_0, end_mask = var_9648_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9648_cast_fp16")]; + tensor var_9652_begin_0 = const()[name = tensor("op_9652_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_9652_end_0 = const()[name = tensor("op_9652_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_9652_end_mask_0 = const()[name = tensor("op_9652_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9652_cast_fp16 = slice_by_index(begin = var_9652_begin_0, end = var_9652_end_0, end_mask = var_9652_end_mask_0, x = q_47_cast_fp16)[name = tensor("op_9652_cast_fp16")]; + tensor k_95_perm_0 = const()[name = tensor("k_95_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_9659_begin_0 = const()[name = tensor("op_9659_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9659_end_0 = const()[name = tensor("op_9659_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_9659_end_mask_0 = const()[name = tensor("op_9659_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_8 = transpose(perm = k_95_perm_0, x = k_93_cast_fp16)[name = tensor("transpose_8")]; + tensor var_9659_cast_fp16 = slice_by_index(begin = var_9659_begin_0, end = var_9659_end_0, end_mask = var_9659_end_mask_0, x = transpose_8)[name = tensor("op_9659_cast_fp16")]; + tensor var_9663_begin_0 = const()[name = tensor("op_9663_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_9663_end_0 = const()[name = tensor("op_9663_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_9663_end_mask_0 = const()[name = tensor("op_9663_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9663_cast_fp16 = slice_by_index(begin = var_9663_begin_0, end = var_9663_end_0, end_mask = var_9663_end_mask_0, x = transpose_8)[name = tensor("op_9663_cast_fp16")]; + tensor var_9667_begin_0 = const()[name = tensor("op_9667_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_9667_end_0 = const()[name = tensor("op_9667_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_9667_end_mask_0 = const()[name = tensor("op_9667_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9667_cast_fp16 = slice_by_index(begin = var_9667_begin_0, end = var_9667_end_0, end_mask = var_9667_end_mask_0, x = transpose_8)[name = tensor("op_9667_cast_fp16")]; + tensor var_9671_begin_0 = const()[name = tensor("op_9671_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_9671_end_0 = const()[name = tensor("op_9671_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_9671_end_mask_0 = const()[name = tensor("op_9671_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9671_cast_fp16 = slice_by_index(begin = var_9671_begin_0, end = var_9671_end_0, end_mask = var_9671_end_mask_0, x = transpose_8)[name = tensor("op_9671_cast_fp16")]; + tensor var_9675_begin_0 = const()[name = tensor("op_9675_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_9675_end_0 = const()[name = tensor("op_9675_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_9675_end_mask_0 = const()[name = tensor("op_9675_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9675_cast_fp16 = slice_by_index(begin = var_9675_begin_0, end = var_9675_end_0, end_mask = var_9675_end_mask_0, x = transpose_8)[name = tensor("op_9675_cast_fp16")]; + tensor var_9679_begin_0 = const()[name = tensor("op_9679_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_9679_end_0 = const()[name = tensor("op_9679_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_9679_end_mask_0 = const()[name = tensor("op_9679_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9679_cast_fp16 = slice_by_index(begin = var_9679_begin_0, end = var_9679_end_0, end_mask = var_9679_end_mask_0, x = transpose_8)[name = tensor("op_9679_cast_fp16")]; + tensor var_9683_begin_0 = const()[name = tensor("op_9683_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_9683_end_0 = const()[name = tensor("op_9683_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_9683_end_mask_0 = const()[name = tensor("op_9683_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9683_cast_fp16 = slice_by_index(begin = var_9683_begin_0, end = var_9683_end_0, end_mask = var_9683_end_mask_0, x = transpose_8)[name = tensor("op_9683_cast_fp16")]; + tensor var_9687_begin_0 = const()[name = tensor("op_9687_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_9687_end_0 = const()[name = tensor("op_9687_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_9687_end_mask_0 = const()[name = tensor("op_9687_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9687_cast_fp16 = slice_by_index(begin = var_9687_begin_0, end = var_9687_end_0, end_mask = var_9687_end_mask_0, x = transpose_8)[name = tensor("op_9687_cast_fp16")]; + tensor var_9691_begin_0 = const()[name = tensor("op_9691_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_9691_end_0 = const()[name = tensor("op_9691_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_9691_end_mask_0 = const()[name = tensor("op_9691_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9691_cast_fp16 = slice_by_index(begin = var_9691_begin_0, end = var_9691_end_0, end_mask = var_9691_end_mask_0, x = transpose_8)[name = tensor("op_9691_cast_fp16")]; + tensor var_9695_begin_0 = const()[name = tensor("op_9695_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_9695_end_0 = const()[name = tensor("op_9695_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_9695_end_mask_0 = const()[name = tensor("op_9695_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_9695_cast_fp16 = slice_by_index(begin = var_9695_begin_0, end = var_9695_end_0, end_mask = var_9695_end_mask_0, x = transpose_8)[name = tensor("op_9695_cast_fp16")]; + tensor var_9697_begin_0 = const()[name = tensor("op_9697_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9697_end_0 = const()[name = tensor("op_9697_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_9697_end_mask_0 = const()[name = tensor("op_9697_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9697_cast_fp16 = slice_by_index(begin = var_9697_begin_0, end = var_9697_end_0, end_mask = var_9697_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9697_cast_fp16")]; + tensor var_9701_begin_0 = const()[name = tensor("op_9701_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_9701_end_0 = const()[name = tensor("op_9701_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_9701_end_mask_0 = const()[name = tensor("op_9701_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9701_cast_fp16 = slice_by_index(begin = var_9701_begin_0, end = var_9701_end_0, end_mask = var_9701_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9701_cast_fp16")]; + tensor var_9705_begin_0 = const()[name = tensor("op_9705_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_9705_end_0 = const()[name = tensor("op_9705_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_9705_end_mask_0 = const()[name = tensor("op_9705_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9705_cast_fp16 = slice_by_index(begin = var_9705_begin_0, end = var_9705_end_0, end_mask = var_9705_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9705_cast_fp16")]; + tensor var_9709_begin_0 = const()[name = tensor("op_9709_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_9709_end_0 = const()[name = tensor("op_9709_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_9709_end_mask_0 = const()[name = tensor("op_9709_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9709_cast_fp16 = slice_by_index(begin = var_9709_begin_0, end = var_9709_end_0, end_mask = var_9709_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9709_cast_fp16")]; + tensor var_9713_begin_0 = const()[name = tensor("op_9713_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_9713_end_0 = const()[name = tensor("op_9713_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_9713_end_mask_0 = const()[name = tensor("op_9713_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9713_cast_fp16 = slice_by_index(begin = var_9713_begin_0, end = var_9713_end_0, end_mask = var_9713_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9713_cast_fp16")]; + tensor var_9717_begin_0 = const()[name = tensor("op_9717_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_9717_end_0 = const()[name = tensor("op_9717_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_9717_end_mask_0 = const()[name = tensor("op_9717_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9717_cast_fp16 = slice_by_index(begin = var_9717_begin_0, end = var_9717_end_0, end_mask = var_9717_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9717_cast_fp16")]; + tensor var_9721_begin_0 = const()[name = tensor("op_9721_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_9721_end_0 = const()[name = tensor("op_9721_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_9721_end_mask_0 = const()[name = tensor("op_9721_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9721_cast_fp16 = slice_by_index(begin = var_9721_begin_0, end = var_9721_end_0, end_mask = var_9721_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9721_cast_fp16")]; + tensor var_9725_begin_0 = const()[name = tensor("op_9725_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_9725_end_0 = const()[name = tensor("op_9725_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_9725_end_mask_0 = const()[name = tensor("op_9725_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9725_cast_fp16 = slice_by_index(begin = var_9725_begin_0, end = var_9725_end_0, end_mask = var_9725_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9725_cast_fp16")]; + tensor var_9729_begin_0 = const()[name = tensor("op_9729_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_9729_end_0 = const()[name = tensor("op_9729_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_9729_end_mask_0 = const()[name = tensor("op_9729_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9729_cast_fp16 = slice_by_index(begin = var_9729_begin_0, end = var_9729_end_0, end_mask = var_9729_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9729_cast_fp16")]; + tensor var_9733_begin_0 = const()[name = tensor("op_9733_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_9733_end_0 = const()[name = tensor("op_9733_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_9733_end_mask_0 = const()[name = tensor("op_9733_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9733_cast_fp16 = slice_by_index(begin = var_9733_begin_0, end = var_9733_end_0, end_mask = var_9733_end_mask_0, x = v_47_cast_fp16)[name = tensor("op_9733_cast_fp16")]; + tensor var_9737_equation_0 = const()[name = tensor("op_9737_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9737_cast_fp16 = einsum(equation = var_9737_equation_0, values = (var_9659_cast_fp16, var_9616_cast_fp16))[name = tensor("op_9737_cast_fp16")]; + tensor var_9738_to_fp16 = const()[name = tensor("op_9738_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_661_cast_fp16 = mul(x = var_9737_cast_fp16, y = var_9738_to_fp16)[name = tensor("aw_661_cast_fp16")]; + tensor var_9741_equation_0 = const()[name = tensor("op_9741_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9741_cast_fp16 = einsum(equation = var_9741_equation_0, values = (var_9663_cast_fp16, var_9620_cast_fp16))[name = tensor("op_9741_cast_fp16")]; + tensor var_9742_to_fp16 = const()[name = tensor("op_9742_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_663_cast_fp16 = mul(x = var_9741_cast_fp16, y = var_9742_to_fp16)[name = tensor("aw_663_cast_fp16")]; + tensor var_9745_equation_0 = const()[name = tensor("op_9745_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9745_cast_fp16 = einsum(equation = var_9745_equation_0, values = (var_9667_cast_fp16, var_9624_cast_fp16))[name = tensor("op_9745_cast_fp16")]; + tensor var_9746_to_fp16 = const()[name = tensor("op_9746_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_665_cast_fp16 = mul(x = var_9745_cast_fp16, y = var_9746_to_fp16)[name = tensor("aw_665_cast_fp16")]; + tensor var_9749_equation_0 = const()[name = tensor("op_9749_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9749_cast_fp16 = einsum(equation = var_9749_equation_0, values = (var_9671_cast_fp16, var_9628_cast_fp16))[name = tensor("op_9749_cast_fp16")]; + tensor var_9750_to_fp16 = const()[name = tensor("op_9750_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_667_cast_fp16 = mul(x = var_9749_cast_fp16, y = var_9750_to_fp16)[name = tensor("aw_667_cast_fp16")]; + tensor var_9753_equation_0 = const()[name = tensor("op_9753_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9753_cast_fp16 = einsum(equation = var_9753_equation_0, values = (var_9675_cast_fp16, var_9632_cast_fp16))[name = tensor("op_9753_cast_fp16")]; + tensor var_9754_to_fp16 = const()[name = tensor("op_9754_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_669_cast_fp16 = mul(x = var_9753_cast_fp16, y = var_9754_to_fp16)[name = tensor("aw_669_cast_fp16")]; + tensor var_9757_equation_0 = const()[name = tensor("op_9757_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9757_cast_fp16 = einsum(equation = var_9757_equation_0, values = (var_9679_cast_fp16, var_9636_cast_fp16))[name = tensor("op_9757_cast_fp16")]; + tensor var_9758_to_fp16 = const()[name = tensor("op_9758_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_671_cast_fp16 = mul(x = var_9757_cast_fp16, y = var_9758_to_fp16)[name = tensor("aw_671_cast_fp16")]; + tensor var_9761_equation_0 = const()[name = tensor("op_9761_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9761_cast_fp16 = einsum(equation = var_9761_equation_0, values = (var_9683_cast_fp16, var_9640_cast_fp16))[name = tensor("op_9761_cast_fp16")]; + tensor var_9762_to_fp16 = const()[name = tensor("op_9762_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_673_cast_fp16 = mul(x = var_9761_cast_fp16, y = var_9762_to_fp16)[name = tensor("aw_673_cast_fp16")]; + tensor var_9765_equation_0 = const()[name = tensor("op_9765_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9765_cast_fp16 = einsum(equation = var_9765_equation_0, values = (var_9687_cast_fp16, var_9644_cast_fp16))[name = tensor("op_9765_cast_fp16")]; + tensor var_9766_to_fp16 = const()[name = tensor("op_9766_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_675_cast_fp16 = mul(x = var_9765_cast_fp16, y = var_9766_to_fp16)[name = tensor("aw_675_cast_fp16")]; + tensor var_9769_equation_0 = const()[name = tensor("op_9769_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9769_cast_fp16 = einsum(equation = var_9769_equation_0, values = (var_9691_cast_fp16, var_9648_cast_fp16))[name = tensor("op_9769_cast_fp16")]; + tensor var_9770_to_fp16 = const()[name = tensor("op_9770_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_677_cast_fp16 = mul(x = var_9769_cast_fp16, y = var_9770_to_fp16)[name = tensor("aw_677_cast_fp16")]; + tensor var_9773_equation_0 = const()[name = tensor("op_9773_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_9773_cast_fp16 = einsum(equation = var_9773_equation_0, values = (var_9695_cast_fp16, var_9652_cast_fp16))[name = tensor("op_9773_cast_fp16")]; + tensor var_9774_to_fp16 = const()[name = tensor("op_9774_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_679_cast_fp16 = mul(x = var_9773_cast_fp16, y = var_9774_to_fp16)[name = tensor("aw_679_cast_fp16")]; + tensor var_9776_cast_fp16 = softmax(axis = var_8627, x = aw_661_cast_fp16)[name = tensor("op_9776_cast_fp16")]; + tensor var_9777_cast_fp16 = softmax(axis = var_8627, x = aw_663_cast_fp16)[name = tensor("op_9777_cast_fp16")]; + tensor var_9778_cast_fp16 = softmax(axis = var_8627, x = aw_665_cast_fp16)[name = tensor("op_9778_cast_fp16")]; + tensor var_9779_cast_fp16 = softmax(axis = var_8627, x = aw_667_cast_fp16)[name = tensor("op_9779_cast_fp16")]; + tensor var_9780_cast_fp16 = softmax(axis = var_8627, x = aw_669_cast_fp16)[name = tensor("op_9780_cast_fp16")]; + tensor var_9781_cast_fp16 = softmax(axis = var_8627, x = aw_671_cast_fp16)[name = tensor("op_9781_cast_fp16")]; + tensor var_9782_cast_fp16 = softmax(axis = var_8627, x = aw_673_cast_fp16)[name = tensor("op_9782_cast_fp16")]; + tensor var_9783_cast_fp16 = softmax(axis = var_8627, x = aw_675_cast_fp16)[name = tensor("op_9783_cast_fp16")]; + tensor var_9784_cast_fp16 = softmax(axis = var_8627, x = aw_677_cast_fp16)[name = tensor("op_9784_cast_fp16")]; + tensor var_9785_cast_fp16 = softmax(axis = var_8627, x = aw_679_cast_fp16)[name = tensor("op_9785_cast_fp16")]; + tensor var_9787_equation_0 = const()[name = tensor("op_9787_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9787_cast_fp16 = einsum(equation = var_9787_equation_0, values = (var_9697_cast_fp16, var_9776_cast_fp16))[name = tensor("op_9787_cast_fp16")]; + tensor var_9789_equation_0 = const()[name = tensor("op_9789_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9789_cast_fp16 = einsum(equation = var_9789_equation_0, values = (var_9701_cast_fp16, var_9777_cast_fp16))[name = tensor("op_9789_cast_fp16")]; + tensor var_9791_equation_0 = const()[name = tensor("op_9791_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9791_cast_fp16 = einsum(equation = var_9791_equation_0, values = (var_9705_cast_fp16, var_9778_cast_fp16))[name = tensor("op_9791_cast_fp16")]; + tensor var_9793_equation_0 = const()[name = tensor("op_9793_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9793_cast_fp16 = einsum(equation = var_9793_equation_0, values = (var_9709_cast_fp16, var_9779_cast_fp16))[name = tensor("op_9793_cast_fp16")]; + tensor var_9795_equation_0 = const()[name = tensor("op_9795_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9795_cast_fp16 = einsum(equation = var_9795_equation_0, values = (var_9713_cast_fp16, var_9780_cast_fp16))[name = tensor("op_9795_cast_fp16")]; + tensor var_9797_equation_0 = const()[name = tensor("op_9797_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9797_cast_fp16 = einsum(equation = var_9797_equation_0, values = (var_9717_cast_fp16, var_9781_cast_fp16))[name = tensor("op_9797_cast_fp16")]; + tensor var_9799_equation_0 = const()[name = tensor("op_9799_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9799_cast_fp16 = einsum(equation = var_9799_equation_0, values = (var_9721_cast_fp16, var_9782_cast_fp16))[name = tensor("op_9799_cast_fp16")]; + tensor var_9801_equation_0 = const()[name = tensor("op_9801_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9801_cast_fp16 = einsum(equation = var_9801_equation_0, values = (var_9725_cast_fp16, var_9783_cast_fp16))[name = tensor("op_9801_cast_fp16")]; + tensor var_9803_equation_0 = const()[name = tensor("op_9803_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9803_cast_fp16 = einsum(equation = var_9803_equation_0, values = (var_9729_cast_fp16, var_9784_cast_fp16))[name = tensor("op_9803_cast_fp16")]; + tensor var_9805_equation_0 = const()[name = tensor("op_9805_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_9805_cast_fp16 = einsum(equation = var_9805_equation_0, values = (var_9733_cast_fp16, var_9785_cast_fp16))[name = tensor("op_9805_cast_fp16")]; + tensor input_411_interleave_0 = const()[name = tensor("input_411_interleave_0"), val = tensor(false)]; + tensor input_411_cast_fp16 = concat(axis = var_8627, interleave = input_411_interleave_0, values = (var_9787_cast_fp16, var_9789_cast_fp16, var_9791_cast_fp16, var_9793_cast_fp16, var_9795_cast_fp16, var_9797_cast_fp16, var_9799_cast_fp16, var_9801_cast_fp16, var_9803_cast_fp16, var_9805_cast_fp16))[name = tensor("input_411_cast_fp16")]; + tensor var_9811 = const()[name = tensor("op_9811"), val = tensor([1, 1])]; + tensor var_9813 = const()[name = tensor("op_9813"), val = tensor([1, 1])]; + tensor var_9815_pad_type_0 = const()[name = tensor("op_9815_pad_type_0"), val = tensor("custom")]; + tensor var_9815_pad_0 = const()[name = tensor("op_9815_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1634051520)))]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1634870784)))]; + tensor var_9815_cast_fp16 = conv(bias = up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_9813, groups = var_8627, pad = var_9815_pad_0, pad_type = var_9815_pad_type_0, strides = var_9811, weight = up_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_411_cast_fp16)[name = tensor("op_9815_cast_fp16")]; + tensor inputs_71_cast_fp16 = add(x = var_9815_cast_fp16, y = inputs_69_cast_fp16)[name = tensor("inputs_71_cast_fp16")]; + tensor var_9819 = const()[name = tensor("op_9819"), val = tensor([1])]; + tensor channels_mean_71_cast_fp16 = reduce_mean(axes = var_9819, keep_dims = var_8622, x = inputs_71_cast_fp16)[name = tensor("channels_mean_71_cast_fp16")]; + tensor zero_mean_71_cast_fp16 = sub(x = inputs_71_cast_fp16, y = channels_mean_71_cast_fp16)[name = tensor("zero_mean_71_cast_fp16")]; + tensor zero_mean_sq_71_cast_fp16 = mul(x = zero_mean_71_cast_fp16, y = zero_mean_71_cast_fp16)[name = tensor("zero_mean_sq_71_cast_fp16")]; + tensor var_9823 = const()[name = tensor("op_9823"), val = tensor([1])]; + tensor var_9824_cast_fp16 = reduce_mean(axes = var_9823, keep_dims = var_8622, x = zero_mean_sq_71_cast_fp16)[name = tensor("op_9824_cast_fp16")]; + tensor var_9825_to_fp16 = const()[name = tensor("op_9825_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_9826_cast_fp16 = add(x = var_9824_cast_fp16, y = var_9825_to_fp16)[name = tensor("op_9826_cast_fp16")]; + tensor denom_71_epsilon_0_to_fp16 = const()[name = tensor("denom_71_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_71_cast_fp16 = rsqrt(epsilon = denom_71_epsilon_0_to_fp16, x = var_9826_cast_fp16)[name = tensor("denom_71_cast_fp16")]; + tensor out_71_cast_fp16 = mul(x = zero_mean_71_cast_fp16, y = denom_71_cast_fp16)[name = tensor("out_71_cast_fp16")]; + tensor var_9830_to_fp16 = const()[name = tensor("op_9830_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1634872128)))]; + tensor var_9831_cast_fp16 = add(x = out_71_cast_fp16, y = var_9830_to_fp16)[name = tensor("op_9831_cast_fp16")]; + tensor var_9833_to_fp16 = const()[name = tensor("op_9833_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1634873472)))]; + tensor input_413_cast_fp16 = mul(x = var_9831_cast_fp16, y = var_9833_to_fp16)[name = tensor("input_413_cast_fp16")]; + tensor var_9841 = const()[name = tensor("op_9841"), val = tensor([1, 1])]; + tensor var_9843 = const()[name = tensor("op_9843"), val = tensor([1, 1])]; + tensor var_9845_pad_type_0 = const()[name = tensor("op_9845_pad_type_0"), val = tensor("custom")]; + tensor var_9845_pad_0 = const()[name = tensor("op_9845_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1634874816)))]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1641428480)))]; + tensor var_9845_cast_fp16 = conv(bias = up_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_9843, groups = var_8627, pad = var_9845_pad_0, pad_type = var_9845_pad_type_0, strides = var_9841, weight = up_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_413_cast_fp16)[name = tensor("op_9845_cast_fp16")]; + tensor var_9846_split_sizes_0 = const()[name = tensor("op_9846_split_sizes_0"), val = tensor([2560, 2560])]; + tensor var_9846_axis_0 = const()[name = tensor("op_9846_axis_0"), val = tensor(1)]; + tensor var_9846_cast_fp16_0, tensor var_9846_cast_fp16_1 = split(axis = var_9846_axis_0, split_sizes = var_9846_split_sizes_0, x = var_9845_cast_fp16)[name = tensor("op_9846_cast_fp16")]; + tensor var_9848_mode_0 = const()[name = tensor("op_9848_mode_0"), val = tensor("EXACT")]; + tensor var_9848_cast_fp16 = gelu(mode = var_9848_mode_0, x = var_9846_cast_fp16_1)[name = tensor("op_9848_cast_fp16")]; + tensor input_415_cast_fp16 = mul(x = var_9846_cast_fp16_0, y = var_9848_cast_fp16)[name = tensor("input_415_cast_fp16")]; + tensor var_9852 = const()[name = tensor("op_9852"), val = tensor([1, 1])]; + tensor var_9854 = const()[name = tensor("op_9854"), val = tensor([1, 1])]; + tensor var_9856_pad_type_0 = const()[name = tensor("op_9856_pad_type_0"), val = tensor("custom")]; + tensor var_9856_pad_0 = const()[name = tensor("op_9856_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1641438784)))]; + tensor up_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1644715648)))]; + tensor var_9856_cast_fp16 = conv(bias = up_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_9854, groups = var_8627, pad = var_9856_pad_0, pad_type = var_9856_pad_type_0, strides = var_9852, weight = up_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_415_cast_fp16)[name = tensor("op_9856_cast_fp16")]; + tensor hidden_states_253_cast_fp16 = add(x = var_9856_cast_fp16, y = inputs_71_cast_fp16)[name = tensor("hidden_states_253_cast_fp16")]; + tensor var_9858 = const()[name = tensor("op_9858"), val = tensor([2, 640, 24, 24])]; + tensor input_417_cast_fp16 = reshape(shape = var_9858, x = hidden_states_253_cast_fp16)[name = tensor("input_417_cast_fp16")]; + tensor var_9862 = const()[name = tensor("op_9862"), val = tensor([1, 1])]; + tensor var_9864 = const()[name = tensor("op_9864"), val = tensor([1, 1])]; + tensor hidden_states_255_pad_type_0 = const()[name = tensor("hidden_states_255_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_255_pad_0 = const()[name = tensor("hidden_states_255_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_1_proj_out_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1644716992)))]; + tensor up_blocks_2_attentions_1_proj_out_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_1_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1645536256)))]; + tensor hidden_states_255_cast_fp16 = conv(bias = up_blocks_2_attentions_1_proj_out_bias_to_fp16, dilations = var_9864, groups = var_8627, pad = hidden_states_255_pad_0, pad_type = hidden_states_255_pad_type_0, strides = var_9862, weight = up_blocks_2_attentions_1_proj_out_weight_to_fp16, x = input_417_cast_fp16)[name = tensor("hidden_states_255_cast_fp16")]; + tensor hidden_states_257_cast_fp16 = add(x = hidden_states_255_cast_fp16, y = hidden_states_243_cast_fp16)[name = tensor("hidden_states_257_cast_fp16")]; + tensor input_419_interleave_0 = const()[name = tensor("input_419_interleave_0"), val = tensor(false)]; + tensor input_419_cast_fp16 = concat(axis = var_8627, interleave = input_419_interleave_0, values = (hidden_states_257_cast_fp16, input_63_cast_fp16))[name = tensor("input_419_cast_fp16")]; + tensor reshape_192_shape_0 = const()[name = tensor("reshape_192_shape_0"), val = tensor([2, 32, 30, 24, 24])]; + tensor reshape_192_cast_fp16 = reshape(shape = reshape_192_shape_0, x = input_419_cast_fp16)[name = tensor("reshape_192_cast_fp16")]; + tensor reduce_mean_144_axes_0 = const()[name = tensor("reduce_mean_144_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_144_keep_dims_0 = const()[name = tensor("reduce_mean_144_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_144_cast_fp16 = reduce_mean(axes = reduce_mean_144_axes_0, keep_dims = reduce_mean_144_keep_dims_0, x = reshape_192_cast_fp16)[name = tensor("reduce_mean_144_cast_fp16")]; + tensor sub_96_cast_fp16 = sub(x = reshape_192_cast_fp16, y = reduce_mean_144_cast_fp16)[name = tensor("sub_96_cast_fp16")]; + tensor square_48_cast_fp16 = square(x = sub_96_cast_fp16)[name = tensor("square_48_cast_fp16")]; + tensor reduce_mean_146_axes_0 = const()[name = tensor("reduce_mean_146_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_146_keep_dims_0 = const()[name = tensor("reduce_mean_146_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_146_cast_fp16 = reduce_mean(axes = reduce_mean_146_axes_0, keep_dims = reduce_mean_146_keep_dims_0, x = square_48_cast_fp16)[name = tensor("reduce_mean_146_cast_fp16")]; + tensor add_96_y_0_to_fp16 = const()[name = tensor("add_96_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_96_cast_fp16 = add(x = reduce_mean_146_cast_fp16, y = add_96_y_0_to_fp16)[name = tensor("add_96_cast_fp16")]; + tensor sqrt_48_cast_fp16 = sqrt(x = add_96_cast_fp16)[name = tensor("sqrt_48_cast_fp16")]; + tensor real_div_48_cast_fp16 = real_div(x = sub_96_cast_fp16, y = sqrt_48_cast_fp16)[name = tensor("real_div_48_cast_fp16")]; + tensor reshape_193_shape_0 = const()[name = tensor("reshape_193_shape_0"), val = tensor([2, 960, 24, 24])]; + tensor reshape_193_cast_fp16 = reshape(shape = reshape_193_shape_0, x = real_div_48_cast_fp16)[name = tensor("reshape_193_cast_fp16")]; + tensor add_97_mean_0_to_fp16 = const()[name = tensor("add_97_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1645537600)))]; + tensor add_97_variance_0_to_fp16 = const()[name = tensor("add_97_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1645539584)))]; + tensor add_97_gamma_0_to_fp16 = const()[name = tensor("add_97_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1645541568)))]; + tensor add_97_beta_0_to_fp16 = const()[name = tensor("add_97_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1645543552)))]; + tensor add_97_epsilon_0_to_fp16 = const()[name = tensor("add_97_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_97_cast_fp16 = batch_norm(beta = add_97_beta_0_to_fp16, epsilon = add_97_epsilon_0_to_fp16, gamma = add_97_gamma_0_to_fp16, mean = add_97_mean_0_to_fp16, variance = add_97_variance_0_to_fp16, x = reshape_193_cast_fp16)[name = tensor("add_97_cast_fp16")]; + tensor input_423_cast_fp16 = silu(x = add_97_cast_fp16)[name = tensor("input_423_cast_fp16")]; + tensor var_9882 = const()[name = tensor("op_9882"), val = tensor([1, 1])]; + tensor var_9884 = const()[name = tensor("op_9884"), val = tensor([1, 1])]; + tensor hidden_states_259_pad_type_0 = const()[name = tensor("hidden_states_259_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_259_pad_0 = const()[name = tensor("hidden_states_259_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_2_resnets_2_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_2_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1645545536)))]; + tensor up_blocks_2_resnets_2_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_2_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1656604800)))]; + tensor hidden_states_259_cast_fp16 = conv(bias = up_blocks_2_resnets_2_conv1_bias_to_fp16, dilations = var_9884, groups = var_8627, pad = hidden_states_259_pad_0, pad_type = hidden_states_259_pad_type_0, strides = var_9882, weight = up_blocks_2_resnets_2_conv1_weight_to_fp16, x = input_423_cast_fp16)[name = tensor("hidden_states_259_cast_fp16")]; + tensor var_9890 = const()[name = tensor("op_9890"), val = tensor([1, 1])]; + tensor var_9892 = const()[name = tensor("op_9892"), val = tensor([1, 1])]; + tensor temb_37_pad_type_0 = const()[name = tensor("temb_37_pad_type_0"), val = tensor("custom")]; + tensor temb_37_pad_0 = const()[name = tensor("temb_37_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_resnets_2_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_2_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1656606144)))]; + tensor up_blocks_2_resnets_2_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_2_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1658244608)))]; + tensor temb_37_cast_fp16 = conv(bias = up_blocks_2_resnets_2_time_emb_proj_bias_to_fp16, dilations = var_9892, groups = var_8627, pad = temb_37_pad_0, pad_type = temb_37_pad_type_0, strides = var_9890, weight = up_blocks_2_resnets_2_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_37_cast_fp16")]; + tensor input_427_cast_fp16 = add(x = hidden_states_259_cast_fp16, y = temb_37_cast_fp16)[name = tensor("input_427_cast_fp16")]; + tensor reshape_196_shape_0 = const()[name = tensor("reshape_196_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_196_cast_fp16 = reshape(shape = reshape_196_shape_0, x = input_427_cast_fp16)[name = tensor("reshape_196_cast_fp16")]; + tensor reduce_mean_147_axes_0 = const()[name = tensor("reduce_mean_147_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_147_keep_dims_0 = const()[name = tensor("reduce_mean_147_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_147_cast_fp16 = reduce_mean(axes = reduce_mean_147_axes_0, keep_dims = reduce_mean_147_keep_dims_0, x = reshape_196_cast_fp16)[name = tensor("reduce_mean_147_cast_fp16")]; + tensor sub_98_cast_fp16 = sub(x = reshape_196_cast_fp16, y = reduce_mean_147_cast_fp16)[name = tensor("sub_98_cast_fp16")]; + tensor square_49_cast_fp16 = square(x = sub_98_cast_fp16)[name = tensor("square_49_cast_fp16")]; + tensor reduce_mean_149_axes_0 = const()[name = tensor("reduce_mean_149_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_149_keep_dims_0 = const()[name = tensor("reduce_mean_149_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_149_cast_fp16 = reduce_mean(axes = reduce_mean_149_axes_0, keep_dims = reduce_mean_149_keep_dims_0, x = square_49_cast_fp16)[name = tensor("reduce_mean_149_cast_fp16")]; + tensor add_98_y_0_to_fp16 = const()[name = tensor("add_98_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_98_cast_fp16 = add(x = reduce_mean_149_cast_fp16, y = add_98_y_0_to_fp16)[name = tensor("add_98_cast_fp16")]; + tensor sqrt_49_cast_fp16 = sqrt(x = add_98_cast_fp16)[name = tensor("sqrt_49_cast_fp16")]; + tensor real_div_49_cast_fp16 = real_div(x = sub_98_cast_fp16, y = sqrt_49_cast_fp16)[name = tensor("real_div_49_cast_fp16")]; + tensor reshape_197_shape_0 = const()[name = tensor("reshape_197_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_197_cast_fp16 = reshape(shape = reshape_197_shape_0, x = real_div_49_cast_fp16)[name = tensor("reshape_197_cast_fp16")]; + tensor add_99_gamma_0_to_fp16 = const()[name = tensor("add_99_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1658245952)))]; + tensor add_99_beta_0_to_fp16 = const()[name = tensor("add_99_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1658247296)))]; + tensor add_99_epsilon_0_to_fp16 = const()[name = tensor("add_99_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_99_cast_fp16 = batch_norm(beta = add_99_beta_0_to_fp16, epsilon = add_99_epsilon_0_to_fp16, gamma = add_99_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_197_cast_fp16)[name = tensor("add_99_cast_fp16")]; + tensor input_431_cast_fp16 = silu(x = add_99_cast_fp16)[name = tensor("input_431_cast_fp16")]; + tensor var_9902 = const()[name = tensor("op_9902"), val = tensor([1, 1])]; + tensor var_9904 = const()[name = tensor("op_9904"), val = tensor([1, 1])]; + tensor hidden_states_261_pad_type_0 = const()[name = tensor("hidden_states_261_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_261_pad_0 = const()[name = tensor("hidden_states_261_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_2_resnets_2_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_2_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1658248640)))]; + tensor up_blocks_2_resnets_2_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_2_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1665621504)))]; + tensor hidden_states_261_cast_fp16 = conv(bias = up_blocks_2_resnets_2_conv2_bias_to_fp16, dilations = var_9904, groups = var_8627, pad = hidden_states_261_pad_0, pad_type = hidden_states_261_pad_type_0, strides = var_9902, weight = up_blocks_2_resnets_2_conv2_weight_to_fp16, x = input_431_cast_fp16)[name = tensor("hidden_states_261_cast_fp16")]; + tensor var_9909 = const()[name = tensor("op_9909"), val = tensor([1, 1])]; + tensor var_9911 = const()[name = tensor("op_9911"), val = tensor([1, 1])]; + tensor x_21_pad_type_0 = const()[name = tensor("x_21_pad_type_0"), val = tensor("custom")]; + tensor x_21_pad_0 = const()[name = tensor("x_21_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_resnets_2_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_2_resnets_2_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1665622848)))]; + tensor up_blocks_2_resnets_2_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_2_resnets_2_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1666851712)))]; + tensor x_21_cast_fp16 = conv(bias = up_blocks_2_resnets_2_conv_shortcut_bias_to_fp16, dilations = var_9911, groups = var_8627, pad = x_21_pad_0, pad_type = x_21_pad_type_0, strides = var_9909, weight = up_blocks_2_resnets_2_conv_shortcut_weight_to_fp16, x = input_419_cast_fp16)[name = tensor("x_21_cast_fp16")]; + tensor hidden_states_263_cast_fp16 = add(x = x_21_cast_fp16, y = hidden_states_261_cast_fp16)[name = tensor("hidden_states_263_cast_fp16")]; + tensor reshape_200_shape_0 = const()[name = tensor("reshape_200_shape_0"), val = tensor([2, 32, 20, 24, 24])]; + tensor reshape_200_cast_fp16 = reshape(shape = reshape_200_shape_0, x = hidden_states_263_cast_fp16)[name = tensor("reshape_200_cast_fp16")]; + tensor reduce_mean_150_axes_0 = const()[name = tensor("reduce_mean_150_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_150_keep_dims_0 = const()[name = tensor("reduce_mean_150_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_150_cast_fp16 = reduce_mean(axes = reduce_mean_150_axes_0, keep_dims = reduce_mean_150_keep_dims_0, x = reshape_200_cast_fp16)[name = tensor("reduce_mean_150_cast_fp16")]; + tensor sub_100_cast_fp16 = sub(x = reshape_200_cast_fp16, y = reduce_mean_150_cast_fp16)[name = tensor("sub_100_cast_fp16")]; + tensor square_50_cast_fp16 = square(x = sub_100_cast_fp16)[name = tensor("square_50_cast_fp16")]; + tensor reduce_mean_152_axes_0 = const()[name = tensor("reduce_mean_152_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_152_keep_dims_0 = const()[name = tensor("reduce_mean_152_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_152_cast_fp16 = reduce_mean(axes = reduce_mean_152_axes_0, keep_dims = reduce_mean_152_keep_dims_0, x = square_50_cast_fp16)[name = tensor("reduce_mean_152_cast_fp16")]; + tensor add_100_y_0_to_fp16 = const()[name = tensor("add_100_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_100_cast_fp16 = add(x = reduce_mean_152_cast_fp16, y = add_100_y_0_to_fp16)[name = tensor("add_100_cast_fp16")]; + tensor sqrt_50_cast_fp16 = sqrt(x = add_100_cast_fp16)[name = tensor("sqrt_50_cast_fp16")]; + tensor real_div_50_cast_fp16 = real_div(x = sub_100_cast_fp16, y = sqrt_50_cast_fp16)[name = tensor("real_div_50_cast_fp16")]; + tensor reshape_201_shape_0 = const()[name = tensor("reshape_201_shape_0"), val = tensor([2, 640, 24, 24])]; + tensor reshape_201_cast_fp16 = reshape(shape = reshape_201_shape_0, x = real_div_50_cast_fp16)[name = tensor("reshape_201_cast_fp16")]; + tensor add_101_gamma_0_to_fp16 = const()[name = tensor("add_101_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1666853056)))]; + tensor add_101_beta_0_to_fp16 = const()[name = tensor("add_101_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1666854400)))]; + tensor add_101_epsilon_0_to_fp16 = const()[name = tensor("add_101_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_101_cast_fp16 = batch_norm(beta = add_101_beta_0_to_fp16, epsilon = add_101_epsilon_0_to_fp16, gamma = add_101_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_201_cast_fp16)[name = tensor("add_101_cast_fp16")]; + tensor var_9931 = const()[name = tensor("op_9931"), val = tensor([1, 1])]; + tensor var_9933 = const()[name = tensor("op_9933"), val = tensor([1, 1])]; + tensor hidden_states_265_pad_type_0 = const()[name = tensor("hidden_states_265_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_265_pad_0 = const()[name = tensor("hidden_states_265_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_proj_in_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1666855744)))]; + tensor up_blocks_2_attentions_2_proj_in_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1667675008)))]; + tensor hidden_states_265_cast_fp16 = conv(bias = up_blocks_2_attentions_2_proj_in_bias_to_fp16, dilations = var_9933, groups = var_8627, pad = hidden_states_265_pad_0, pad_type = hidden_states_265_pad_type_0, strides = var_9931, weight = up_blocks_2_attentions_2_proj_in_weight_to_fp16, x = add_101_cast_fp16)[name = tensor("hidden_states_265_cast_fp16")]; + tensor var_9938 = const()[name = tensor("op_9938"), val = tensor([2, 640, 1, 576])]; + tensor inputs_73_cast_fp16 = reshape(shape = var_9938, x = hidden_states_265_cast_fp16)[name = tensor("inputs_73_cast_fp16")]; + tensor var_9948 = const()[name = tensor("op_9948"), val = tensor([1])]; + tensor channels_mean_73_cast_fp16 = reduce_mean(axes = var_9948, keep_dims = var_8622, x = inputs_73_cast_fp16)[name = tensor("channels_mean_73_cast_fp16")]; + tensor zero_mean_73_cast_fp16 = sub(x = inputs_73_cast_fp16, y = channels_mean_73_cast_fp16)[name = tensor("zero_mean_73_cast_fp16")]; + tensor zero_mean_sq_73_cast_fp16 = mul(x = zero_mean_73_cast_fp16, y = zero_mean_73_cast_fp16)[name = tensor("zero_mean_sq_73_cast_fp16")]; + tensor var_9952 = const()[name = tensor("op_9952"), val = tensor([1])]; + tensor var_9953_cast_fp16 = reduce_mean(axes = var_9952, keep_dims = var_8622, x = zero_mean_sq_73_cast_fp16)[name = tensor("op_9953_cast_fp16")]; + tensor var_9954_to_fp16 = const()[name = tensor("op_9954_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_9955_cast_fp16 = add(x = var_9953_cast_fp16, y = var_9954_to_fp16)[name = tensor("op_9955_cast_fp16")]; + tensor denom_73_epsilon_0_to_fp16 = const()[name = tensor("denom_73_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_73_cast_fp16 = rsqrt(epsilon = denom_73_epsilon_0_to_fp16, x = var_9955_cast_fp16)[name = tensor("denom_73_cast_fp16")]; + tensor out_73_cast_fp16 = mul(x = zero_mean_73_cast_fp16, y = denom_73_cast_fp16)[name = tensor("out_73_cast_fp16")]; + tensor var_9959_to_fp16 = const()[name = tensor("op_9959_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1667676352)))]; + tensor var_9960_cast_fp16 = add(x = out_73_cast_fp16, y = var_9959_to_fp16)[name = tensor("op_9960_cast_fp16")]; + tensor var_9962_to_fp16 = const()[name = tensor("op_9962_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1667677696)))]; + tensor hidden_states_267_cast_fp16 = mul(x = var_9960_cast_fp16, y = var_9962_to_fp16)[name = tensor("hidden_states_267_cast_fp16")]; + tensor var_9969 = const()[name = tensor("op_9969"), val = tensor([1, 1])]; + tensor var_9971 = const()[name = tensor("op_9971"), val = tensor([1, 1])]; + tensor q_49_pad_type_0 = const()[name = tensor("q_49_pad_type_0"), val = tensor("custom")]; + tensor q_49_pad_0 = const()[name = tensor("q_49_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1667679040)))]; + tensor q_49_cast_fp16 = conv(dilations = var_9971, groups = var_8627, pad = q_49_pad_0, pad_type = q_49_pad_type_0, strides = var_9969, weight = up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_267_cast_fp16)[name = tensor("q_49_cast_fp16")]; + tensor var_9975 = const()[name = tensor("op_9975"), val = tensor([1, 1])]; + tensor var_9977 = const()[name = tensor("op_9977"), val = tensor([1, 1])]; + tensor k_97_pad_type_0 = const()[name = tensor("k_97_pad_type_0"), val = tensor("custom")]; + tensor k_97_pad_0 = const()[name = tensor("k_97_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1668498304)))]; + tensor k_97_cast_fp16 = conv(dilations = var_9977, groups = var_8627, pad = k_97_pad_0, pad_type = k_97_pad_type_0, strides = var_9975, weight = up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_267_cast_fp16)[name = tensor("k_97_cast_fp16")]; + tensor var_9981 = const()[name = tensor("op_9981"), val = tensor([1, 1])]; + tensor var_9983 = const()[name = tensor("op_9983"), val = tensor([1, 1])]; + tensor v_49_pad_type_0 = const()[name = tensor("v_49_pad_type_0"), val = tensor("custom")]; + tensor v_49_pad_0 = const()[name = tensor("v_49_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1669317568)))]; + tensor v_49_cast_fp16 = conv(dilations = var_9983, groups = var_8627, pad = v_49_pad_0, pad_type = v_49_pad_type_0, strides = var_9981, weight = up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_267_cast_fp16)[name = tensor("v_49_cast_fp16")]; + tensor var_9987_begin_0 = const()[name = tensor("op_9987_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_9987_end_0 = const()[name = tensor("op_9987_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_9987_end_mask_0 = const()[name = tensor("op_9987_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9987_cast_fp16 = slice_by_index(begin = var_9987_begin_0, end = var_9987_end_0, end_mask = var_9987_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_9987_cast_fp16")]; + tensor var_9991_begin_0 = const()[name = tensor("op_9991_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_9991_end_0 = const()[name = tensor("op_9991_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_9991_end_mask_0 = const()[name = tensor("op_9991_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9991_cast_fp16 = slice_by_index(begin = var_9991_begin_0, end = var_9991_end_0, end_mask = var_9991_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_9991_cast_fp16")]; + tensor var_9995_begin_0 = const()[name = tensor("op_9995_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_9995_end_0 = const()[name = tensor("op_9995_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_9995_end_mask_0 = const()[name = tensor("op_9995_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9995_cast_fp16 = slice_by_index(begin = var_9995_begin_0, end = var_9995_end_0, end_mask = var_9995_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_9995_cast_fp16")]; + tensor var_9999_begin_0 = const()[name = tensor("op_9999_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_9999_end_0 = const()[name = tensor("op_9999_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_9999_end_mask_0 = const()[name = tensor("op_9999_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_9999_cast_fp16 = slice_by_index(begin = var_9999_begin_0, end = var_9999_end_0, end_mask = var_9999_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_9999_cast_fp16")]; + tensor var_10003_begin_0 = const()[name = tensor("op_10003_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_10003_end_0 = const()[name = tensor("op_10003_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_10003_end_mask_0 = const()[name = tensor("op_10003_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10003_cast_fp16 = slice_by_index(begin = var_10003_begin_0, end = var_10003_end_0, end_mask = var_10003_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_10003_cast_fp16")]; + tensor var_10007_begin_0 = const()[name = tensor("op_10007_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_10007_end_0 = const()[name = tensor("op_10007_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_10007_end_mask_0 = const()[name = tensor("op_10007_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10007_cast_fp16 = slice_by_index(begin = var_10007_begin_0, end = var_10007_end_0, end_mask = var_10007_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_10007_cast_fp16")]; + tensor var_10011_begin_0 = const()[name = tensor("op_10011_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_10011_end_0 = const()[name = tensor("op_10011_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_10011_end_mask_0 = const()[name = tensor("op_10011_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10011_cast_fp16 = slice_by_index(begin = var_10011_begin_0, end = var_10011_end_0, end_mask = var_10011_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_10011_cast_fp16")]; + tensor var_10015_begin_0 = const()[name = tensor("op_10015_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_10015_end_0 = const()[name = tensor("op_10015_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_10015_end_mask_0 = const()[name = tensor("op_10015_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10015_cast_fp16 = slice_by_index(begin = var_10015_begin_0, end = var_10015_end_0, end_mask = var_10015_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_10015_cast_fp16")]; + tensor var_10019_begin_0 = const()[name = tensor("op_10019_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_10019_end_0 = const()[name = tensor("op_10019_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_10019_end_mask_0 = const()[name = tensor("op_10019_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10019_cast_fp16 = slice_by_index(begin = var_10019_begin_0, end = var_10019_end_0, end_mask = var_10019_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_10019_cast_fp16")]; + tensor var_10023_begin_0 = const()[name = tensor("op_10023_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_10023_end_0 = const()[name = tensor("op_10023_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_10023_end_mask_0 = const()[name = tensor("op_10023_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10023_cast_fp16 = slice_by_index(begin = var_10023_begin_0, end = var_10023_end_0, end_mask = var_10023_end_mask_0, x = q_49_cast_fp16)[name = tensor("op_10023_cast_fp16")]; + tensor k_99_perm_0 = const()[name = tensor("k_99_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_10030_begin_0 = const()[name = tensor("op_10030_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10030_end_0 = const()[name = tensor("op_10030_end_0"), val = tensor([2, 576, 1, 64])]; + tensor var_10030_end_mask_0 = const()[name = tensor("op_10030_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_7 = transpose(perm = k_99_perm_0, x = k_97_cast_fp16)[name = tensor("transpose_7")]; + tensor var_10030_cast_fp16 = slice_by_index(begin = var_10030_begin_0, end = var_10030_end_0, end_mask = var_10030_end_mask_0, x = transpose_7)[name = tensor("op_10030_cast_fp16")]; + tensor var_10034_begin_0 = const()[name = tensor("op_10034_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_10034_end_0 = const()[name = tensor("op_10034_end_0"), val = tensor([2, 576, 1, 128])]; + tensor var_10034_end_mask_0 = const()[name = tensor("op_10034_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10034_cast_fp16 = slice_by_index(begin = var_10034_begin_0, end = var_10034_end_0, end_mask = var_10034_end_mask_0, x = transpose_7)[name = tensor("op_10034_cast_fp16")]; + tensor var_10038_begin_0 = const()[name = tensor("op_10038_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_10038_end_0 = const()[name = tensor("op_10038_end_0"), val = tensor([2, 576, 1, 192])]; + tensor var_10038_end_mask_0 = const()[name = tensor("op_10038_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10038_cast_fp16 = slice_by_index(begin = var_10038_begin_0, end = var_10038_end_0, end_mask = var_10038_end_mask_0, x = transpose_7)[name = tensor("op_10038_cast_fp16")]; + tensor var_10042_begin_0 = const()[name = tensor("op_10042_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_10042_end_0 = const()[name = tensor("op_10042_end_0"), val = tensor([2, 576, 1, 256])]; + tensor var_10042_end_mask_0 = const()[name = tensor("op_10042_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10042_cast_fp16 = slice_by_index(begin = var_10042_begin_0, end = var_10042_end_0, end_mask = var_10042_end_mask_0, x = transpose_7)[name = tensor("op_10042_cast_fp16")]; + tensor var_10046_begin_0 = const()[name = tensor("op_10046_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_10046_end_0 = const()[name = tensor("op_10046_end_0"), val = tensor([2, 576, 1, 320])]; + tensor var_10046_end_mask_0 = const()[name = tensor("op_10046_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10046_cast_fp16 = slice_by_index(begin = var_10046_begin_0, end = var_10046_end_0, end_mask = var_10046_end_mask_0, x = transpose_7)[name = tensor("op_10046_cast_fp16")]; + tensor var_10050_begin_0 = const()[name = tensor("op_10050_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_10050_end_0 = const()[name = tensor("op_10050_end_0"), val = tensor([2, 576, 1, 384])]; + tensor var_10050_end_mask_0 = const()[name = tensor("op_10050_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10050_cast_fp16 = slice_by_index(begin = var_10050_begin_0, end = var_10050_end_0, end_mask = var_10050_end_mask_0, x = transpose_7)[name = tensor("op_10050_cast_fp16")]; + tensor var_10054_begin_0 = const()[name = tensor("op_10054_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_10054_end_0 = const()[name = tensor("op_10054_end_0"), val = tensor([2, 576, 1, 448])]; + tensor var_10054_end_mask_0 = const()[name = tensor("op_10054_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10054_cast_fp16 = slice_by_index(begin = var_10054_begin_0, end = var_10054_end_0, end_mask = var_10054_end_mask_0, x = transpose_7)[name = tensor("op_10054_cast_fp16")]; + tensor var_10058_begin_0 = const()[name = tensor("op_10058_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_10058_end_0 = const()[name = tensor("op_10058_end_0"), val = tensor([2, 576, 1, 512])]; + tensor var_10058_end_mask_0 = const()[name = tensor("op_10058_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10058_cast_fp16 = slice_by_index(begin = var_10058_begin_0, end = var_10058_end_0, end_mask = var_10058_end_mask_0, x = transpose_7)[name = tensor("op_10058_cast_fp16")]; + tensor var_10062_begin_0 = const()[name = tensor("op_10062_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_10062_end_0 = const()[name = tensor("op_10062_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_10062_end_mask_0 = const()[name = tensor("op_10062_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10062_cast_fp16 = slice_by_index(begin = var_10062_begin_0, end = var_10062_end_0, end_mask = var_10062_end_mask_0, x = transpose_7)[name = tensor("op_10062_cast_fp16")]; + tensor var_10066_begin_0 = const()[name = tensor("op_10066_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_10066_end_0 = const()[name = tensor("op_10066_end_0"), val = tensor([2, 576, 1, 640])]; + tensor var_10066_end_mask_0 = const()[name = tensor("op_10066_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10066_cast_fp16 = slice_by_index(begin = var_10066_begin_0, end = var_10066_end_0, end_mask = var_10066_end_mask_0, x = transpose_7)[name = tensor("op_10066_cast_fp16")]; + tensor var_10068_begin_0 = const()[name = tensor("op_10068_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10068_end_0 = const()[name = tensor("op_10068_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_10068_end_mask_0 = const()[name = tensor("op_10068_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10068_cast_fp16 = slice_by_index(begin = var_10068_begin_0, end = var_10068_end_0, end_mask = var_10068_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10068_cast_fp16")]; + tensor var_10072_begin_0 = const()[name = tensor("op_10072_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_10072_end_0 = const()[name = tensor("op_10072_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_10072_end_mask_0 = const()[name = tensor("op_10072_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10072_cast_fp16 = slice_by_index(begin = var_10072_begin_0, end = var_10072_end_0, end_mask = var_10072_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10072_cast_fp16")]; + tensor var_10076_begin_0 = const()[name = tensor("op_10076_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_10076_end_0 = const()[name = tensor("op_10076_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_10076_end_mask_0 = const()[name = tensor("op_10076_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10076_cast_fp16 = slice_by_index(begin = var_10076_begin_0, end = var_10076_end_0, end_mask = var_10076_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10076_cast_fp16")]; + tensor var_10080_begin_0 = const()[name = tensor("op_10080_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_10080_end_0 = const()[name = tensor("op_10080_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_10080_end_mask_0 = const()[name = tensor("op_10080_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10080_cast_fp16 = slice_by_index(begin = var_10080_begin_0, end = var_10080_end_0, end_mask = var_10080_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10080_cast_fp16")]; + tensor var_10084_begin_0 = const()[name = tensor("op_10084_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_10084_end_0 = const()[name = tensor("op_10084_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_10084_end_mask_0 = const()[name = tensor("op_10084_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10084_cast_fp16 = slice_by_index(begin = var_10084_begin_0, end = var_10084_end_0, end_mask = var_10084_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10084_cast_fp16")]; + tensor var_10088_begin_0 = const()[name = tensor("op_10088_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_10088_end_0 = const()[name = tensor("op_10088_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_10088_end_mask_0 = const()[name = tensor("op_10088_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10088_cast_fp16 = slice_by_index(begin = var_10088_begin_0, end = var_10088_end_0, end_mask = var_10088_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10088_cast_fp16")]; + tensor var_10092_begin_0 = const()[name = tensor("op_10092_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_10092_end_0 = const()[name = tensor("op_10092_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_10092_end_mask_0 = const()[name = tensor("op_10092_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10092_cast_fp16 = slice_by_index(begin = var_10092_begin_0, end = var_10092_end_0, end_mask = var_10092_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10092_cast_fp16")]; + tensor var_10096_begin_0 = const()[name = tensor("op_10096_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_10096_end_0 = const()[name = tensor("op_10096_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_10096_end_mask_0 = const()[name = tensor("op_10096_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10096_cast_fp16 = slice_by_index(begin = var_10096_begin_0, end = var_10096_end_0, end_mask = var_10096_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10096_cast_fp16")]; + tensor var_10100_begin_0 = const()[name = tensor("op_10100_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_10100_end_0 = const()[name = tensor("op_10100_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_10100_end_mask_0 = const()[name = tensor("op_10100_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10100_cast_fp16 = slice_by_index(begin = var_10100_begin_0, end = var_10100_end_0, end_mask = var_10100_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10100_cast_fp16")]; + tensor var_10104_begin_0 = const()[name = tensor("op_10104_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_10104_end_0 = const()[name = tensor("op_10104_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_10104_end_mask_0 = const()[name = tensor("op_10104_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10104_cast_fp16 = slice_by_index(begin = var_10104_begin_0, end = var_10104_end_0, end_mask = var_10104_end_mask_0, x = v_49_cast_fp16)[name = tensor("op_10104_cast_fp16")]; + tensor var_10108_equation_0 = const()[name = tensor("op_10108_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10108_cast_fp16 = einsum(equation = var_10108_equation_0, values = (var_10030_cast_fp16, var_9987_cast_fp16))[name = tensor("op_10108_cast_fp16")]; + tensor var_10109_to_fp16 = const()[name = tensor("op_10109_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_681_cast_fp16 = mul(x = var_10108_cast_fp16, y = var_10109_to_fp16)[name = tensor("aw_681_cast_fp16")]; + tensor var_10112_equation_0 = const()[name = tensor("op_10112_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10112_cast_fp16 = einsum(equation = var_10112_equation_0, values = (var_10034_cast_fp16, var_9991_cast_fp16))[name = tensor("op_10112_cast_fp16")]; + tensor var_10113_to_fp16 = const()[name = tensor("op_10113_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_683_cast_fp16 = mul(x = var_10112_cast_fp16, y = var_10113_to_fp16)[name = tensor("aw_683_cast_fp16")]; + tensor var_10116_equation_0 = const()[name = tensor("op_10116_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10116_cast_fp16 = einsum(equation = var_10116_equation_0, values = (var_10038_cast_fp16, var_9995_cast_fp16))[name = tensor("op_10116_cast_fp16")]; + tensor var_10117_to_fp16 = const()[name = tensor("op_10117_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_685_cast_fp16 = mul(x = var_10116_cast_fp16, y = var_10117_to_fp16)[name = tensor("aw_685_cast_fp16")]; + tensor var_10120_equation_0 = const()[name = tensor("op_10120_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10120_cast_fp16 = einsum(equation = var_10120_equation_0, values = (var_10042_cast_fp16, var_9999_cast_fp16))[name = tensor("op_10120_cast_fp16")]; + tensor var_10121_to_fp16 = const()[name = tensor("op_10121_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_687_cast_fp16 = mul(x = var_10120_cast_fp16, y = var_10121_to_fp16)[name = tensor("aw_687_cast_fp16")]; + tensor var_10124_equation_0 = const()[name = tensor("op_10124_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10124_cast_fp16 = einsum(equation = var_10124_equation_0, values = (var_10046_cast_fp16, var_10003_cast_fp16))[name = tensor("op_10124_cast_fp16")]; + tensor var_10125_to_fp16 = const()[name = tensor("op_10125_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_689_cast_fp16 = mul(x = var_10124_cast_fp16, y = var_10125_to_fp16)[name = tensor("aw_689_cast_fp16")]; + tensor var_10128_equation_0 = const()[name = tensor("op_10128_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10128_cast_fp16 = einsum(equation = var_10128_equation_0, values = (var_10050_cast_fp16, var_10007_cast_fp16))[name = tensor("op_10128_cast_fp16")]; + tensor var_10129_to_fp16 = const()[name = tensor("op_10129_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_691_cast_fp16 = mul(x = var_10128_cast_fp16, y = var_10129_to_fp16)[name = tensor("aw_691_cast_fp16")]; + tensor var_10132_equation_0 = const()[name = tensor("op_10132_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10132_cast_fp16 = einsum(equation = var_10132_equation_0, values = (var_10054_cast_fp16, var_10011_cast_fp16))[name = tensor("op_10132_cast_fp16")]; + tensor var_10133_to_fp16 = const()[name = tensor("op_10133_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_693_cast_fp16 = mul(x = var_10132_cast_fp16, y = var_10133_to_fp16)[name = tensor("aw_693_cast_fp16")]; + tensor var_10136_equation_0 = const()[name = tensor("op_10136_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10136_cast_fp16 = einsum(equation = var_10136_equation_0, values = (var_10058_cast_fp16, var_10015_cast_fp16))[name = tensor("op_10136_cast_fp16")]; + tensor var_10137_to_fp16 = const()[name = tensor("op_10137_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_695_cast_fp16 = mul(x = var_10136_cast_fp16, y = var_10137_to_fp16)[name = tensor("aw_695_cast_fp16")]; + tensor var_10140_equation_0 = const()[name = tensor("op_10140_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10140_cast_fp16 = einsum(equation = var_10140_equation_0, values = (var_10062_cast_fp16, var_10019_cast_fp16))[name = tensor("op_10140_cast_fp16")]; + tensor var_10141_to_fp16 = const()[name = tensor("op_10141_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_697_cast_fp16 = mul(x = var_10140_cast_fp16, y = var_10141_to_fp16)[name = tensor("aw_697_cast_fp16")]; + tensor var_10144_equation_0 = const()[name = tensor("op_10144_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10144_cast_fp16 = einsum(equation = var_10144_equation_0, values = (var_10066_cast_fp16, var_10023_cast_fp16))[name = tensor("op_10144_cast_fp16")]; + tensor var_10145_to_fp16 = const()[name = tensor("op_10145_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_699_cast_fp16 = mul(x = var_10144_cast_fp16, y = var_10145_to_fp16)[name = tensor("aw_699_cast_fp16")]; + tensor var_10147_cast_fp16 = softmax(axis = var_8627, x = aw_681_cast_fp16)[name = tensor("op_10147_cast_fp16")]; + tensor var_10148_cast_fp16 = softmax(axis = var_8627, x = aw_683_cast_fp16)[name = tensor("op_10148_cast_fp16")]; + tensor var_10149_cast_fp16 = softmax(axis = var_8627, x = aw_685_cast_fp16)[name = tensor("op_10149_cast_fp16")]; + tensor var_10150_cast_fp16 = softmax(axis = var_8627, x = aw_687_cast_fp16)[name = tensor("op_10150_cast_fp16")]; + tensor var_10151_cast_fp16 = softmax(axis = var_8627, x = aw_689_cast_fp16)[name = tensor("op_10151_cast_fp16")]; + tensor var_10152_cast_fp16 = softmax(axis = var_8627, x = aw_691_cast_fp16)[name = tensor("op_10152_cast_fp16")]; + tensor var_10153_cast_fp16 = softmax(axis = var_8627, x = aw_693_cast_fp16)[name = tensor("op_10153_cast_fp16")]; + tensor var_10154_cast_fp16 = softmax(axis = var_8627, x = aw_695_cast_fp16)[name = tensor("op_10154_cast_fp16")]; + tensor var_10155_cast_fp16 = softmax(axis = var_8627, x = aw_697_cast_fp16)[name = tensor("op_10155_cast_fp16")]; + tensor var_10156_cast_fp16 = softmax(axis = var_8627, x = aw_699_cast_fp16)[name = tensor("op_10156_cast_fp16")]; + tensor var_10158_equation_0 = const()[name = tensor("op_10158_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10158_cast_fp16 = einsum(equation = var_10158_equation_0, values = (var_10068_cast_fp16, var_10147_cast_fp16))[name = tensor("op_10158_cast_fp16")]; + tensor var_10160_equation_0 = const()[name = tensor("op_10160_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10160_cast_fp16 = einsum(equation = var_10160_equation_0, values = (var_10072_cast_fp16, var_10148_cast_fp16))[name = tensor("op_10160_cast_fp16")]; + tensor var_10162_equation_0 = const()[name = tensor("op_10162_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10162_cast_fp16 = einsum(equation = var_10162_equation_0, values = (var_10076_cast_fp16, var_10149_cast_fp16))[name = tensor("op_10162_cast_fp16")]; + tensor var_10164_equation_0 = const()[name = tensor("op_10164_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10164_cast_fp16 = einsum(equation = var_10164_equation_0, values = (var_10080_cast_fp16, var_10150_cast_fp16))[name = tensor("op_10164_cast_fp16")]; + tensor var_10166_equation_0 = const()[name = tensor("op_10166_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10166_cast_fp16 = einsum(equation = var_10166_equation_0, values = (var_10084_cast_fp16, var_10151_cast_fp16))[name = tensor("op_10166_cast_fp16")]; + tensor var_10168_equation_0 = const()[name = tensor("op_10168_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10168_cast_fp16 = einsum(equation = var_10168_equation_0, values = (var_10088_cast_fp16, var_10152_cast_fp16))[name = tensor("op_10168_cast_fp16")]; + tensor var_10170_equation_0 = const()[name = tensor("op_10170_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10170_cast_fp16 = einsum(equation = var_10170_equation_0, values = (var_10092_cast_fp16, var_10153_cast_fp16))[name = tensor("op_10170_cast_fp16")]; + tensor var_10172_equation_0 = const()[name = tensor("op_10172_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10172_cast_fp16 = einsum(equation = var_10172_equation_0, values = (var_10096_cast_fp16, var_10154_cast_fp16))[name = tensor("op_10172_cast_fp16")]; + tensor var_10174_equation_0 = const()[name = tensor("op_10174_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10174_cast_fp16 = einsum(equation = var_10174_equation_0, values = (var_10100_cast_fp16, var_10155_cast_fp16))[name = tensor("op_10174_cast_fp16")]; + tensor var_10176_equation_0 = const()[name = tensor("op_10176_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10176_cast_fp16 = einsum(equation = var_10176_equation_0, values = (var_10104_cast_fp16, var_10156_cast_fp16))[name = tensor("op_10176_cast_fp16")]; + tensor input_435_interleave_0 = const()[name = tensor("input_435_interleave_0"), val = tensor(false)]; + tensor input_435_cast_fp16 = concat(axis = var_8627, interleave = input_435_interleave_0, values = (var_10158_cast_fp16, var_10160_cast_fp16, var_10162_cast_fp16, var_10164_cast_fp16, var_10166_cast_fp16, var_10168_cast_fp16, var_10170_cast_fp16, var_10172_cast_fp16, var_10174_cast_fp16, var_10176_cast_fp16))[name = tensor("input_435_cast_fp16")]; + tensor var_10182 = const()[name = tensor("op_10182"), val = tensor([1, 1])]; + tensor var_10184 = const()[name = tensor("op_10184"), val = tensor([1, 1])]; + tensor var_10186_pad_type_0 = const()[name = tensor("op_10186_pad_type_0"), val = tensor("custom")]; + tensor var_10186_pad_0 = const()[name = tensor("op_10186_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1670136832)))]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1670956096)))]; + tensor var_10186_cast_fp16 = conv(bias = up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_10184, groups = var_8627, pad = var_10186_pad_0, pad_type = var_10186_pad_type_0, strides = var_10182, weight = up_blocks_2_attentions_2_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_435_cast_fp16)[name = tensor("op_10186_cast_fp16")]; + tensor inputs_75_cast_fp16 = add(x = var_10186_cast_fp16, y = inputs_73_cast_fp16)[name = tensor("inputs_75_cast_fp16")]; + tensor var_10190 = const()[name = tensor("op_10190"), val = tensor([1])]; + tensor channels_mean_75_cast_fp16 = reduce_mean(axes = var_10190, keep_dims = var_8622, x = inputs_75_cast_fp16)[name = tensor("channels_mean_75_cast_fp16")]; + tensor zero_mean_75_cast_fp16 = sub(x = inputs_75_cast_fp16, y = channels_mean_75_cast_fp16)[name = tensor("zero_mean_75_cast_fp16")]; + tensor zero_mean_sq_75_cast_fp16 = mul(x = zero_mean_75_cast_fp16, y = zero_mean_75_cast_fp16)[name = tensor("zero_mean_sq_75_cast_fp16")]; + tensor var_10194 = const()[name = tensor("op_10194"), val = tensor([1])]; + tensor var_10195_cast_fp16 = reduce_mean(axes = var_10194, keep_dims = var_8622, x = zero_mean_sq_75_cast_fp16)[name = tensor("op_10195_cast_fp16")]; + tensor var_10196_to_fp16 = const()[name = tensor("op_10196_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_10197_cast_fp16 = add(x = var_10195_cast_fp16, y = var_10196_to_fp16)[name = tensor("op_10197_cast_fp16")]; + tensor denom_75_epsilon_0_to_fp16 = const()[name = tensor("denom_75_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_75_cast_fp16 = rsqrt(epsilon = denom_75_epsilon_0_to_fp16, x = var_10197_cast_fp16)[name = tensor("denom_75_cast_fp16")]; + tensor out_75_cast_fp16 = mul(x = zero_mean_75_cast_fp16, y = denom_75_cast_fp16)[name = tensor("out_75_cast_fp16")]; + tensor var_10201_to_fp16 = const()[name = tensor("op_10201_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1670957440)))]; + tensor var_10202_cast_fp16 = add(x = out_75_cast_fp16, y = var_10201_to_fp16)[name = tensor("op_10202_cast_fp16")]; + tensor var_10204_to_fp16 = const()[name = tensor("op_10204_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1670958784)))]; + tensor hidden_states_269_cast_fp16 = mul(x = var_10202_cast_fp16, y = var_10204_to_fp16)[name = tensor("hidden_states_269_cast_fp16")]; + tensor var_10211 = const()[name = tensor("op_10211"), val = tensor([1, 1])]; + tensor var_10213 = const()[name = tensor("op_10213"), val = tensor([1, 1])]; + tensor q_51_pad_type_0 = const()[name = tensor("q_51_pad_type_0"), val = tensor("custom")]; + tensor q_51_pad_0 = const()[name = tensor("q_51_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1670960128)))]; + tensor q_51_cast_fp16 = conv(dilations = var_10213, groups = var_8627, pad = q_51_pad_0, pad_type = q_51_pad_type_0, strides = var_10211, weight = up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_269_cast_fp16)[name = tensor("q_51_cast_fp16")]; + tensor var_10217 = const()[name = tensor("op_10217"), val = tensor([1, 1])]; + tensor var_10219 = const()[name = tensor("op_10219"), val = tensor([1, 1])]; + tensor k_101_pad_type_0 = const()[name = tensor("k_101_pad_type_0"), val = tensor("custom")]; + tensor k_101_pad_0 = const()[name = tensor("k_101_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1671779392)))]; + tensor k_101_cast_fp16 = conv(dilations = var_10219, groups = var_8627, pad = k_101_pad_0, pad_type = k_101_pad_type_0, strides = var_10217, weight = up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_101_cast_fp16")]; + tensor var_10223 = const()[name = tensor("op_10223"), val = tensor([1, 1])]; + tensor var_10225 = const()[name = tensor("op_10225"), val = tensor([1, 1])]; + tensor v_51_pad_type_0 = const()[name = tensor("v_51_pad_type_0"), val = tensor("custom")]; + tensor v_51_pad_0 = const()[name = tensor("v_51_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1673090176)))]; + tensor v_51_cast_fp16 = conv(dilations = var_10225, groups = var_8627, pad = v_51_pad_0, pad_type = v_51_pad_type_0, strides = var_10223, weight = up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_51_cast_fp16")]; + tensor var_10229_begin_0 = const()[name = tensor("op_10229_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10229_end_0 = const()[name = tensor("op_10229_end_0"), val = tensor([2, 64, 1, 576])]; + tensor var_10229_end_mask_0 = const()[name = tensor("op_10229_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10229_cast_fp16 = slice_by_index(begin = var_10229_begin_0, end = var_10229_end_0, end_mask = var_10229_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10229_cast_fp16")]; + tensor var_10233_begin_0 = const()[name = tensor("op_10233_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_10233_end_0 = const()[name = tensor("op_10233_end_0"), val = tensor([2, 128, 1, 576])]; + tensor var_10233_end_mask_0 = const()[name = tensor("op_10233_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10233_cast_fp16 = slice_by_index(begin = var_10233_begin_0, end = var_10233_end_0, end_mask = var_10233_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10233_cast_fp16")]; + tensor var_10237_begin_0 = const()[name = tensor("op_10237_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_10237_end_0 = const()[name = tensor("op_10237_end_0"), val = tensor([2, 192, 1, 576])]; + tensor var_10237_end_mask_0 = const()[name = tensor("op_10237_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10237_cast_fp16 = slice_by_index(begin = var_10237_begin_0, end = var_10237_end_0, end_mask = var_10237_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10237_cast_fp16")]; + tensor var_10241_begin_0 = const()[name = tensor("op_10241_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_10241_end_0 = const()[name = tensor("op_10241_end_0"), val = tensor([2, 256, 1, 576])]; + tensor var_10241_end_mask_0 = const()[name = tensor("op_10241_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10241_cast_fp16 = slice_by_index(begin = var_10241_begin_0, end = var_10241_end_0, end_mask = var_10241_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10241_cast_fp16")]; + tensor var_10245_begin_0 = const()[name = tensor("op_10245_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_10245_end_0 = const()[name = tensor("op_10245_end_0"), val = tensor([2, 320, 1, 576])]; + tensor var_10245_end_mask_0 = const()[name = tensor("op_10245_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10245_cast_fp16 = slice_by_index(begin = var_10245_begin_0, end = var_10245_end_0, end_mask = var_10245_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10245_cast_fp16")]; + tensor var_10249_begin_0 = const()[name = tensor("op_10249_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_10249_end_0 = const()[name = tensor("op_10249_end_0"), val = tensor([2, 384, 1, 576])]; + tensor var_10249_end_mask_0 = const()[name = tensor("op_10249_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10249_cast_fp16 = slice_by_index(begin = var_10249_begin_0, end = var_10249_end_0, end_mask = var_10249_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10249_cast_fp16")]; + tensor var_10253_begin_0 = const()[name = tensor("op_10253_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_10253_end_0 = const()[name = tensor("op_10253_end_0"), val = tensor([2, 448, 1, 576])]; + tensor var_10253_end_mask_0 = const()[name = tensor("op_10253_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10253_cast_fp16 = slice_by_index(begin = var_10253_begin_0, end = var_10253_end_0, end_mask = var_10253_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10253_cast_fp16")]; + tensor var_10257_begin_0 = const()[name = tensor("op_10257_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_10257_end_0 = const()[name = tensor("op_10257_end_0"), val = tensor([2, 512, 1, 576])]; + tensor var_10257_end_mask_0 = const()[name = tensor("op_10257_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10257_cast_fp16 = slice_by_index(begin = var_10257_begin_0, end = var_10257_end_0, end_mask = var_10257_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10257_cast_fp16")]; + tensor var_10261_begin_0 = const()[name = tensor("op_10261_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_10261_end_0 = const()[name = tensor("op_10261_end_0"), val = tensor([2, 576, 1, 576])]; + tensor var_10261_end_mask_0 = const()[name = tensor("op_10261_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10261_cast_fp16 = slice_by_index(begin = var_10261_begin_0, end = var_10261_end_0, end_mask = var_10261_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10261_cast_fp16")]; + tensor var_10265_begin_0 = const()[name = tensor("op_10265_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_10265_end_0 = const()[name = tensor("op_10265_end_0"), val = tensor([2, 640, 1, 576])]; + tensor var_10265_end_mask_0 = const()[name = tensor("op_10265_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10265_cast_fp16 = slice_by_index(begin = var_10265_begin_0, end = var_10265_end_0, end_mask = var_10265_end_mask_0, x = q_51_cast_fp16)[name = tensor("op_10265_cast_fp16")]; + tensor k_103_perm_0 = const()[name = tensor("k_103_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_10272_begin_0 = const()[name = tensor("op_10272_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10272_end_0 = const()[name = tensor("op_10272_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_10272_end_mask_0 = const()[name = tensor("op_10272_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_6 = transpose(perm = k_103_perm_0, x = k_101_cast_fp16)[name = tensor("transpose_6")]; + tensor var_10272_cast_fp16 = slice_by_index(begin = var_10272_begin_0, end = var_10272_end_0, end_mask = var_10272_end_mask_0, x = transpose_6)[name = tensor("op_10272_cast_fp16")]; + tensor var_10276_begin_0 = const()[name = tensor("op_10276_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_10276_end_0 = const()[name = tensor("op_10276_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_10276_end_mask_0 = const()[name = tensor("op_10276_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10276_cast_fp16 = slice_by_index(begin = var_10276_begin_0, end = var_10276_end_0, end_mask = var_10276_end_mask_0, x = transpose_6)[name = tensor("op_10276_cast_fp16")]; + tensor var_10280_begin_0 = const()[name = tensor("op_10280_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_10280_end_0 = const()[name = tensor("op_10280_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_10280_end_mask_0 = const()[name = tensor("op_10280_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10280_cast_fp16 = slice_by_index(begin = var_10280_begin_0, end = var_10280_end_0, end_mask = var_10280_end_mask_0, x = transpose_6)[name = tensor("op_10280_cast_fp16")]; + tensor var_10284_begin_0 = const()[name = tensor("op_10284_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_10284_end_0 = const()[name = tensor("op_10284_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_10284_end_mask_0 = const()[name = tensor("op_10284_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10284_cast_fp16 = slice_by_index(begin = var_10284_begin_0, end = var_10284_end_0, end_mask = var_10284_end_mask_0, x = transpose_6)[name = tensor("op_10284_cast_fp16")]; + tensor var_10288_begin_0 = const()[name = tensor("op_10288_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_10288_end_0 = const()[name = tensor("op_10288_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_10288_end_mask_0 = const()[name = tensor("op_10288_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10288_cast_fp16 = slice_by_index(begin = var_10288_begin_0, end = var_10288_end_0, end_mask = var_10288_end_mask_0, x = transpose_6)[name = tensor("op_10288_cast_fp16")]; + tensor var_10292_begin_0 = const()[name = tensor("op_10292_begin_0"), val = tensor([0, 0, 0, 320])]; + tensor var_10292_end_0 = const()[name = tensor("op_10292_end_0"), val = tensor([2, 77, 1, 384])]; + tensor var_10292_end_mask_0 = const()[name = tensor("op_10292_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10292_cast_fp16 = slice_by_index(begin = var_10292_begin_0, end = var_10292_end_0, end_mask = var_10292_end_mask_0, x = transpose_6)[name = tensor("op_10292_cast_fp16")]; + tensor var_10296_begin_0 = const()[name = tensor("op_10296_begin_0"), val = tensor([0, 0, 0, 384])]; + tensor var_10296_end_0 = const()[name = tensor("op_10296_end_0"), val = tensor([2, 77, 1, 448])]; + tensor var_10296_end_mask_0 = const()[name = tensor("op_10296_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10296_cast_fp16 = slice_by_index(begin = var_10296_begin_0, end = var_10296_end_0, end_mask = var_10296_end_mask_0, x = transpose_6)[name = tensor("op_10296_cast_fp16")]; + tensor var_10300_begin_0 = const()[name = tensor("op_10300_begin_0"), val = tensor([0, 0, 0, 448])]; + tensor var_10300_end_0 = const()[name = tensor("op_10300_end_0"), val = tensor([2, 77, 1, 512])]; + tensor var_10300_end_mask_0 = const()[name = tensor("op_10300_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10300_cast_fp16 = slice_by_index(begin = var_10300_begin_0, end = var_10300_end_0, end_mask = var_10300_end_mask_0, x = transpose_6)[name = tensor("op_10300_cast_fp16")]; + tensor var_10304_begin_0 = const()[name = tensor("op_10304_begin_0"), val = tensor([0, 0, 0, 512])]; + tensor var_10304_end_0 = const()[name = tensor("op_10304_end_0"), val = tensor([2, 77, 1, 576])]; + tensor var_10304_end_mask_0 = const()[name = tensor("op_10304_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10304_cast_fp16 = slice_by_index(begin = var_10304_begin_0, end = var_10304_end_0, end_mask = var_10304_end_mask_0, x = transpose_6)[name = tensor("op_10304_cast_fp16")]; + tensor var_10308_begin_0 = const()[name = tensor("op_10308_begin_0"), val = tensor([0, 0, 0, 576])]; + tensor var_10308_end_0 = const()[name = tensor("op_10308_end_0"), val = tensor([2, 77, 1, 640])]; + tensor var_10308_end_mask_0 = const()[name = tensor("op_10308_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10308_cast_fp16 = slice_by_index(begin = var_10308_begin_0, end = var_10308_end_0, end_mask = var_10308_end_mask_0, x = transpose_6)[name = tensor("op_10308_cast_fp16")]; + tensor var_10310_begin_0 = const()[name = tensor("op_10310_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10310_end_0 = const()[name = tensor("op_10310_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_10310_end_mask_0 = const()[name = tensor("op_10310_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10310_cast_fp16 = slice_by_index(begin = var_10310_begin_0, end = var_10310_end_0, end_mask = var_10310_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10310_cast_fp16")]; + tensor var_10314_begin_0 = const()[name = tensor("op_10314_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_10314_end_0 = const()[name = tensor("op_10314_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_10314_end_mask_0 = const()[name = tensor("op_10314_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10314_cast_fp16 = slice_by_index(begin = var_10314_begin_0, end = var_10314_end_0, end_mask = var_10314_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10314_cast_fp16")]; + tensor var_10318_begin_0 = const()[name = tensor("op_10318_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_10318_end_0 = const()[name = tensor("op_10318_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_10318_end_mask_0 = const()[name = tensor("op_10318_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10318_cast_fp16 = slice_by_index(begin = var_10318_begin_0, end = var_10318_end_0, end_mask = var_10318_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10318_cast_fp16")]; + tensor var_10322_begin_0 = const()[name = tensor("op_10322_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_10322_end_0 = const()[name = tensor("op_10322_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_10322_end_mask_0 = const()[name = tensor("op_10322_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10322_cast_fp16 = slice_by_index(begin = var_10322_begin_0, end = var_10322_end_0, end_mask = var_10322_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10322_cast_fp16")]; + tensor var_10326_begin_0 = const()[name = tensor("op_10326_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_10326_end_0 = const()[name = tensor("op_10326_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_10326_end_mask_0 = const()[name = tensor("op_10326_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10326_cast_fp16 = slice_by_index(begin = var_10326_begin_0, end = var_10326_end_0, end_mask = var_10326_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10326_cast_fp16")]; + tensor var_10330_begin_0 = const()[name = tensor("op_10330_begin_0"), val = tensor([0, 320, 0, 0])]; + tensor var_10330_end_0 = const()[name = tensor("op_10330_end_0"), val = tensor([2, 384, 1, 77])]; + tensor var_10330_end_mask_0 = const()[name = tensor("op_10330_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10330_cast_fp16 = slice_by_index(begin = var_10330_begin_0, end = var_10330_end_0, end_mask = var_10330_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10330_cast_fp16")]; + tensor var_10334_begin_0 = const()[name = tensor("op_10334_begin_0"), val = tensor([0, 384, 0, 0])]; + tensor var_10334_end_0 = const()[name = tensor("op_10334_end_0"), val = tensor([2, 448, 1, 77])]; + tensor var_10334_end_mask_0 = const()[name = tensor("op_10334_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10334_cast_fp16 = slice_by_index(begin = var_10334_begin_0, end = var_10334_end_0, end_mask = var_10334_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10334_cast_fp16")]; + tensor var_10338_begin_0 = const()[name = tensor("op_10338_begin_0"), val = tensor([0, 448, 0, 0])]; + tensor var_10338_end_0 = const()[name = tensor("op_10338_end_0"), val = tensor([2, 512, 1, 77])]; + tensor var_10338_end_mask_0 = const()[name = tensor("op_10338_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10338_cast_fp16 = slice_by_index(begin = var_10338_begin_0, end = var_10338_end_0, end_mask = var_10338_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10338_cast_fp16")]; + tensor var_10342_begin_0 = const()[name = tensor("op_10342_begin_0"), val = tensor([0, 512, 0, 0])]; + tensor var_10342_end_0 = const()[name = tensor("op_10342_end_0"), val = tensor([2, 576, 1, 77])]; + tensor var_10342_end_mask_0 = const()[name = tensor("op_10342_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10342_cast_fp16 = slice_by_index(begin = var_10342_begin_0, end = var_10342_end_0, end_mask = var_10342_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10342_cast_fp16")]; + tensor var_10346_begin_0 = const()[name = tensor("op_10346_begin_0"), val = tensor([0, 576, 0, 0])]; + tensor var_10346_end_0 = const()[name = tensor("op_10346_end_0"), val = tensor([2, 640, 1, 77])]; + tensor var_10346_end_mask_0 = const()[name = tensor("op_10346_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10346_cast_fp16 = slice_by_index(begin = var_10346_begin_0, end = var_10346_end_0, end_mask = var_10346_end_mask_0, x = v_51_cast_fp16)[name = tensor("op_10346_cast_fp16")]; + tensor var_10350_equation_0 = const()[name = tensor("op_10350_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10350_cast_fp16 = einsum(equation = var_10350_equation_0, values = (var_10272_cast_fp16, var_10229_cast_fp16))[name = tensor("op_10350_cast_fp16")]; + tensor var_10351_to_fp16 = const()[name = tensor("op_10351_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_701_cast_fp16 = mul(x = var_10350_cast_fp16, y = var_10351_to_fp16)[name = tensor("aw_701_cast_fp16")]; + tensor var_10354_equation_0 = const()[name = tensor("op_10354_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10354_cast_fp16 = einsum(equation = var_10354_equation_0, values = (var_10276_cast_fp16, var_10233_cast_fp16))[name = tensor("op_10354_cast_fp16")]; + tensor var_10355_to_fp16 = const()[name = tensor("op_10355_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_703_cast_fp16 = mul(x = var_10354_cast_fp16, y = var_10355_to_fp16)[name = tensor("aw_703_cast_fp16")]; + tensor var_10358_equation_0 = const()[name = tensor("op_10358_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10358_cast_fp16 = einsum(equation = var_10358_equation_0, values = (var_10280_cast_fp16, var_10237_cast_fp16))[name = tensor("op_10358_cast_fp16")]; + tensor var_10359_to_fp16 = const()[name = tensor("op_10359_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_705_cast_fp16 = mul(x = var_10358_cast_fp16, y = var_10359_to_fp16)[name = tensor("aw_705_cast_fp16")]; + tensor var_10362_equation_0 = const()[name = tensor("op_10362_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10362_cast_fp16 = einsum(equation = var_10362_equation_0, values = (var_10284_cast_fp16, var_10241_cast_fp16))[name = tensor("op_10362_cast_fp16")]; + tensor var_10363_to_fp16 = const()[name = tensor("op_10363_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_707_cast_fp16 = mul(x = var_10362_cast_fp16, y = var_10363_to_fp16)[name = tensor("aw_707_cast_fp16")]; + tensor var_10366_equation_0 = const()[name = tensor("op_10366_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10366_cast_fp16 = einsum(equation = var_10366_equation_0, values = (var_10288_cast_fp16, var_10245_cast_fp16))[name = tensor("op_10366_cast_fp16")]; + tensor var_10367_to_fp16 = const()[name = tensor("op_10367_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_709_cast_fp16 = mul(x = var_10366_cast_fp16, y = var_10367_to_fp16)[name = tensor("aw_709_cast_fp16")]; + tensor var_10370_equation_0 = const()[name = tensor("op_10370_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10370_cast_fp16 = einsum(equation = var_10370_equation_0, values = (var_10292_cast_fp16, var_10249_cast_fp16))[name = tensor("op_10370_cast_fp16")]; + tensor var_10371_to_fp16 = const()[name = tensor("op_10371_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_711_cast_fp16 = mul(x = var_10370_cast_fp16, y = var_10371_to_fp16)[name = tensor("aw_711_cast_fp16")]; + tensor var_10374_equation_0 = const()[name = tensor("op_10374_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10374_cast_fp16 = einsum(equation = var_10374_equation_0, values = (var_10296_cast_fp16, var_10253_cast_fp16))[name = tensor("op_10374_cast_fp16")]; + tensor var_10375_to_fp16 = const()[name = tensor("op_10375_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_713_cast_fp16 = mul(x = var_10374_cast_fp16, y = var_10375_to_fp16)[name = tensor("aw_713_cast_fp16")]; + tensor var_10378_equation_0 = const()[name = tensor("op_10378_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10378_cast_fp16 = einsum(equation = var_10378_equation_0, values = (var_10300_cast_fp16, var_10257_cast_fp16))[name = tensor("op_10378_cast_fp16")]; + tensor var_10379_to_fp16 = const()[name = tensor("op_10379_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_715_cast_fp16 = mul(x = var_10378_cast_fp16, y = var_10379_to_fp16)[name = tensor("aw_715_cast_fp16")]; + tensor var_10382_equation_0 = const()[name = tensor("op_10382_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10382_cast_fp16 = einsum(equation = var_10382_equation_0, values = (var_10304_cast_fp16, var_10261_cast_fp16))[name = tensor("op_10382_cast_fp16")]; + tensor var_10383_to_fp16 = const()[name = tensor("op_10383_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_717_cast_fp16 = mul(x = var_10382_cast_fp16, y = var_10383_to_fp16)[name = tensor("aw_717_cast_fp16")]; + tensor var_10386_equation_0 = const()[name = tensor("op_10386_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10386_cast_fp16 = einsum(equation = var_10386_equation_0, values = (var_10308_cast_fp16, var_10265_cast_fp16))[name = tensor("op_10386_cast_fp16")]; + tensor var_10387_to_fp16 = const()[name = tensor("op_10387_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_719_cast_fp16 = mul(x = var_10386_cast_fp16, y = var_10387_to_fp16)[name = tensor("aw_719_cast_fp16")]; + tensor var_10389_cast_fp16 = softmax(axis = var_8627, x = aw_701_cast_fp16)[name = tensor("op_10389_cast_fp16")]; + tensor var_10390_cast_fp16 = softmax(axis = var_8627, x = aw_703_cast_fp16)[name = tensor("op_10390_cast_fp16")]; + tensor var_10391_cast_fp16 = softmax(axis = var_8627, x = aw_705_cast_fp16)[name = tensor("op_10391_cast_fp16")]; + tensor var_10392_cast_fp16 = softmax(axis = var_8627, x = aw_707_cast_fp16)[name = tensor("op_10392_cast_fp16")]; + tensor var_10393_cast_fp16 = softmax(axis = var_8627, x = aw_709_cast_fp16)[name = tensor("op_10393_cast_fp16")]; + tensor var_10394_cast_fp16 = softmax(axis = var_8627, x = aw_711_cast_fp16)[name = tensor("op_10394_cast_fp16")]; + tensor var_10395_cast_fp16 = softmax(axis = var_8627, x = aw_713_cast_fp16)[name = tensor("op_10395_cast_fp16")]; + tensor var_10396_cast_fp16 = softmax(axis = var_8627, x = aw_715_cast_fp16)[name = tensor("op_10396_cast_fp16")]; + tensor var_10397_cast_fp16 = softmax(axis = var_8627, x = aw_717_cast_fp16)[name = tensor("op_10397_cast_fp16")]; + tensor var_10398_cast_fp16 = softmax(axis = var_8627, x = aw_719_cast_fp16)[name = tensor("op_10398_cast_fp16")]; + tensor var_10400_equation_0 = const()[name = tensor("op_10400_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10400_cast_fp16 = einsum(equation = var_10400_equation_0, values = (var_10310_cast_fp16, var_10389_cast_fp16))[name = tensor("op_10400_cast_fp16")]; + tensor var_10402_equation_0 = const()[name = tensor("op_10402_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10402_cast_fp16 = einsum(equation = var_10402_equation_0, values = (var_10314_cast_fp16, var_10390_cast_fp16))[name = tensor("op_10402_cast_fp16")]; + tensor var_10404_equation_0 = const()[name = tensor("op_10404_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10404_cast_fp16 = einsum(equation = var_10404_equation_0, values = (var_10318_cast_fp16, var_10391_cast_fp16))[name = tensor("op_10404_cast_fp16")]; + tensor var_10406_equation_0 = const()[name = tensor("op_10406_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10406_cast_fp16 = einsum(equation = var_10406_equation_0, values = (var_10322_cast_fp16, var_10392_cast_fp16))[name = tensor("op_10406_cast_fp16")]; + tensor var_10408_equation_0 = const()[name = tensor("op_10408_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10408_cast_fp16 = einsum(equation = var_10408_equation_0, values = (var_10326_cast_fp16, var_10393_cast_fp16))[name = tensor("op_10408_cast_fp16")]; + tensor var_10410_equation_0 = const()[name = tensor("op_10410_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10410_cast_fp16 = einsum(equation = var_10410_equation_0, values = (var_10330_cast_fp16, var_10394_cast_fp16))[name = tensor("op_10410_cast_fp16")]; + tensor var_10412_equation_0 = const()[name = tensor("op_10412_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10412_cast_fp16 = einsum(equation = var_10412_equation_0, values = (var_10334_cast_fp16, var_10395_cast_fp16))[name = tensor("op_10412_cast_fp16")]; + tensor var_10414_equation_0 = const()[name = tensor("op_10414_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10414_cast_fp16 = einsum(equation = var_10414_equation_0, values = (var_10338_cast_fp16, var_10396_cast_fp16))[name = tensor("op_10414_cast_fp16")]; + tensor var_10416_equation_0 = const()[name = tensor("op_10416_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10416_cast_fp16 = einsum(equation = var_10416_equation_0, values = (var_10342_cast_fp16, var_10397_cast_fp16))[name = tensor("op_10416_cast_fp16")]; + tensor var_10418_equation_0 = const()[name = tensor("op_10418_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10418_cast_fp16 = einsum(equation = var_10418_equation_0, values = (var_10346_cast_fp16, var_10398_cast_fp16))[name = tensor("op_10418_cast_fp16")]; + tensor input_437_interleave_0 = const()[name = tensor("input_437_interleave_0"), val = tensor(false)]; + tensor input_437_cast_fp16 = concat(axis = var_8627, interleave = input_437_interleave_0, values = (var_10400_cast_fp16, var_10402_cast_fp16, var_10404_cast_fp16, var_10406_cast_fp16, var_10408_cast_fp16, var_10410_cast_fp16, var_10412_cast_fp16, var_10414_cast_fp16, var_10416_cast_fp16, var_10418_cast_fp16))[name = tensor("input_437_cast_fp16")]; + tensor var_10424 = const()[name = tensor("op_10424"), val = tensor([1, 1])]; + tensor var_10426 = const()[name = tensor("op_10426"), val = tensor([1, 1])]; + tensor var_10428_pad_type_0 = const()[name = tensor("op_10428_pad_type_0"), val = tensor("custom")]; + tensor var_10428_pad_0 = const()[name = tensor("op_10428_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1674400960)))]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1675220224)))]; + tensor var_10428_cast_fp16 = conv(bias = up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_10426, groups = var_8627, pad = var_10428_pad_0, pad_type = var_10428_pad_type_0, strides = var_10424, weight = up_blocks_2_attentions_2_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_437_cast_fp16)[name = tensor("op_10428_cast_fp16")]; + tensor inputs_77_cast_fp16 = add(x = var_10428_cast_fp16, y = inputs_75_cast_fp16)[name = tensor("inputs_77_cast_fp16")]; + tensor var_10432 = const()[name = tensor("op_10432"), val = tensor([1])]; + tensor channels_mean_77_cast_fp16 = reduce_mean(axes = var_10432, keep_dims = var_8622, x = inputs_77_cast_fp16)[name = tensor("channels_mean_77_cast_fp16")]; + tensor zero_mean_77_cast_fp16 = sub(x = inputs_77_cast_fp16, y = channels_mean_77_cast_fp16)[name = tensor("zero_mean_77_cast_fp16")]; + tensor zero_mean_sq_77_cast_fp16 = mul(x = zero_mean_77_cast_fp16, y = zero_mean_77_cast_fp16)[name = tensor("zero_mean_sq_77_cast_fp16")]; + tensor var_10436 = const()[name = tensor("op_10436"), val = tensor([1])]; + tensor var_10437_cast_fp16 = reduce_mean(axes = var_10436, keep_dims = var_8622, x = zero_mean_sq_77_cast_fp16)[name = tensor("op_10437_cast_fp16")]; + tensor var_10438_to_fp16 = const()[name = tensor("op_10438_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_10439_cast_fp16 = add(x = var_10437_cast_fp16, y = var_10438_to_fp16)[name = tensor("op_10439_cast_fp16")]; + tensor denom_77_epsilon_0_to_fp16 = const()[name = tensor("denom_77_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_77_cast_fp16 = rsqrt(epsilon = denom_77_epsilon_0_to_fp16, x = var_10439_cast_fp16)[name = tensor("denom_77_cast_fp16")]; + tensor out_77_cast_fp16 = mul(x = zero_mean_77_cast_fp16, y = denom_77_cast_fp16)[name = tensor("out_77_cast_fp16")]; + tensor var_10443_to_fp16 = const()[name = tensor("op_10443_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1675221568)))]; + tensor var_10444_cast_fp16 = add(x = out_77_cast_fp16, y = var_10443_to_fp16)[name = tensor("op_10444_cast_fp16")]; + tensor var_10446_to_fp16 = const()[name = tensor("op_10446_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1675222912)))]; + tensor input_439_cast_fp16 = mul(x = var_10444_cast_fp16, y = var_10446_to_fp16)[name = tensor("input_439_cast_fp16")]; + tensor var_10454 = const()[name = tensor("op_10454"), val = tensor([1, 1])]; + tensor var_10456 = const()[name = tensor("op_10456"), val = tensor([1, 1])]; + tensor var_10458_pad_type_0 = const()[name = tensor("op_10458_pad_type_0"), val = tensor("custom")]; + tensor var_10458_pad_0 = const()[name = tensor("op_10458_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1675224256)))]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1681777920)))]; + tensor var_10458_cast_fp16 = conv(bias = up_blocks_2_attentions_2_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_10456, groups = var_8627, pad = var_10458_pad_0, pad_type = var_10458_pad_type_0, strides = var_10454, weight = up_blocks_2_attentions_2_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_439_cast_fp16)[name = tensor("op_10458_cast_fp16")]; + tensor var_10459_split_sizes_0 = const()[name = tensor("op_10459_split_sizes_0"), val = tensor([2560, 2560])]; + tensor var_10459_axis_0 = const()[name = tensor("op_10459_axis_0"), val = tensor(1)]; + tensor var_10459_cast_fp16_0, tensor var_10459_cast_fp16_1 = split(axis = var_10459_axis_0, split_sizes = var_10459_split_sizes_0, x = var_10458_cast_fp16)[name = tensor("op_10459_cast_fp16")]; + tensor var_10461_mode_0 = const()[name = tensor("op_10461_mode_0"), val = tensor("EXACT")]; + tensor var_10461_cast_fp16 = gelu(mode = var_10461_mode_0, x = var_10459_cast_fp16_1)[name = tensor("op_10461_cast_fp16")]; + tensor input_441_cast_fp16 = mul(x = var_10459_cast_fp16_0, y = var_10461_cast_fp16)[name = tensor("input_441_cast_fp16")]; + tensor var_10465 = const()[name = tensor("op_10465"), val = tensor([1, 1])]; + tensor var_10467 = const()[name = tensor("op_10467"), val = tensor([1, 1])]; + tensor var_10469_pad_type_0 = const()[name = tensor("op_10469_pad_type_0"), val = tensor("custom")]; + tensor var_10469_pad_0 = const()[name = tensor("op_10469_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1681788224)))]; + tensor up_blocks_2_attentions_2_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1685065088)))]; + tensor var_10469_cast_fp16 = conv(bias = up_blocks_2_attentions_2_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_10467, groups = var_8627, pad = var_10469_pad_0, pad_type = var_10469_pad_type_0, strides = var_10465, weight = up_blocks_2_attentions_2_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_441_cast_fp16)[name = tensor("op_10469_cast_fp16")]; + tensor hidden_states_273_cast_fp16 = add(x = var_10469_cast_fp16, y = inputs_77_cast_fp16)[name = tensor("hidden_states_273_cast_fp16")]; + tensor var_10471 = const()[name = tensor("op_10471"), val = tensor([2, 640, 24, 24])]; + tensor input_443_cast_fp16 = reshape(shape = var_10471, x = hidden_states_273_cast_fp16)[name = tensor("input_443_cast_fp16")]; + tensor var_10475 = const()[name = tensor("op_10475"), val = tensor([1, 1])]; + tensor var_10477 = const()[name = tensor("op_10477"), val = tensor([1, 1])]; + tensor hidden_states_275_pad_type_0 = const()[name = tensor("hidden_states_275_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_275_pad_0 = const()[name = tensor("hidden_states_275_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_2_attentions_2_proj_out_weight_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1685066432)))]; + tensor up_blocks_2_attentions_2_proj_out_bias_to_fp16 = const()[name = tensor("up_blocks_2_attentions_2_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1685885696)))]; + tensor hidden_states_275_cast_fp16 = conv(bias = up_blocks_2_attentions_2_proj_out_bias_to_fp16, dilations = var_10477, groups = var_8627, pad = hidden_states_275_pad_0, pad_type = hidden_states_275_pad_type_0, strides = var_10475, weight = up_blocks_2_attentions_2_proj_out_weight_to_fp16, x = input_443_cast_fp16)[name = tensor("hidden_states_275_cast_fp16")]; + tensor input_445_cast_fp16 = add(x = hidden_states_275_cast_fp16, y = hidden_states_263_cast_fp16)[name = tensor("input_445_cast_fp16")]; + tensor input_447_scale_factor_height_0 = const()[name = tensor("input_447_scale_factor_height_0"), val = tensor(0x1p+1)]; + tensor input_447_scale_factor_width_0 = const()[name = tensor("input_447_scale_factor_width_0"), val = tensor(0x1p+1)]; + tensor input_447_cast_fp16 = upsample_nearest_neighbor(scale_factor_height = input_447_scale_factor_height_0, scale_factor_width = input_447_scale_factor_width_0, x = input_445_cast_fp16)[name = tensor("input_447_cast_fp16")]; + tensor var_10486 = const()[name = tensor("op_10486"), val = tensor([1, 1])]; + tensor var_10488 = const()[name = tensor("op_10488"), val = tensor([1, 1])]; + tensor hidden_states_277_pad_type_0 = const()[name = tensor("hidden_states_277_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_277_pad_0 = const()[name = tensor("hidden_states_277_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_2_upsamplers_0_conv_weight_to_fp16 = const()[name = tensor("up_blocks_2_upsamplers_0_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1685887040)))]; + tensor up_blocks_2_upsamplers_0_conv_bias_to_fp16 = const()[name = tensor("up_blocks_2_upsamplers_0_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1693259904)))]; + tensor hidden_states_277_cast_fp16 = conv(bias = up_blocks_2_upsamplers_0_conv_bias_to_fp16, dilations = var_10488, groups = var_8627, pad = hidden_states_277_pad_0, pad_type = hidden_states_277_pad_type_0, strides = var_10486, weight = up_blocks_2_upsamplers_0_conv_weight_to_fp16, x = input_447_cast_fp16)[name = tensor("hidden_states_277_cast_fp16")]; + tensor var_10504 = const()[name = tensor("op_10504"), val = tensor(true)]; + tensor var_10509 = const()[name = tensor("op_10509"), val = tensor(1)]; + tensor input_449_interleave_0 = const()[name = tensor("input_449_interleave_0"), val = tensor(false)]; + tensor input_449_cast_fp16 = concat(axis = var_10509, interleave = input_449_interleave_0, values = (hidden_states_277_cast_fp16, input_61_cast_fp16))[name = tensor("input_449_cast_fp16")]; + tensor reshape_204_shape_0 = const()[name = tensor("reshape_204_shape_0"), val = tensor([2, 32, 30, 48, 48])]; + tensor reshape_204_cast_fp16 = reshape(shape = reshape_204_shape_0, x = input_449_cast_fp16)[name = tensor("reshape_204_cast_fp16")]; + tensor reduce_mean_153_axes_0 = const()[name = tensor("reduce_mean_153_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_153_keep_dims_0 = const()[name = tensor("reduce_mean_153_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_153_cast_fp16 = reduce_mean(axes = reduce_mean_153_axes_0, keep_dims = reduce_mean_153_keep_dims_0, x = reshape_204_cast_fp16)[name = tensor("reduce_mean_153_cast_fp16")]; + tensor sub_102_cast_fp16 = sub(x = reshape_204_cast_fp16, y = reduce_mean_153_cast_fp16)[name = tensor("sub_102_cast_fp16")]; + tensor square_51_cast_fp16 = square(x = sub_102_cast_fp16)[name = tensor("square_51_cast_fp16")]; + tensor reduce_mean_155_axes_0 = const()[name = tensor("reduce_mean_155_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_155_keep_dims_0 = const()[name = tensor("reduce_mean_155_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_155_cast_fp16 = reduce_mean(axes = reduce_mean_155_axes_0, keep_dims = reduce_mean_155_keep_dims_0, x = square_51_cast_fp16)[name = tensor("reduce_mean_155_cast_fp16")]; + tensor add_102_y_0_to_fp16 = const()[name = tensor("add_102_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_102_cast_fp16 = add(x = reduce_mean_155_cast_fp16, y = add_102_y_0_to_fp16)[name = tensor("add_102_cast_fp16")]; + tensor sqrt_51_cast_fp16 = sqrt(x = add_102_cast_fp16)[name = tensor("sqrt_51_cast_fp16")]; + tensor real_div_51_cast_fp16 = real_div(x = sub_102_cast_fp16, y = sqrt_51_cast_fp16)[name = tensor("real_div_51_cast_fp16")]; + tensor reshape_205_shape_0 = const()[name = tensor("reshape_205_shape_0"), val = tensor([2, 960, 48, 48])]; + tensor reshape_205_cast_fp16 = reshape(shape = reshape_205_shape_0, x = real_div_51_cast_fp16)[name = tensor("reshape_205_cast_fp16")]; + tensor add_103_gamma_0_to_fp16 = const()[name = tensor("add_103_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1693261248)))]; + tensor add_103_beta_0_to_fp16 = const()[name = tensor("add_103_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1693263232)))]; + tensor add_103_epsilon_0_to_fp16 = const()[name = tensor("add_103_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_103_cast_fp16 = batch_norm(beta = add_103_beta_0_to_fp16, epsilon = add_103_epsilon_0_to_fp16, gamma = add_103_gamma_0_to_fp16, mean = add_97_mean_0_to_fp16, variance = add_97_variance_0_to_fp16, x = reshape_205_cast_fp16)[name = tensor("add_103_cast_fp16")]; + tensor input_453_cast_fp16 = silu(x = add_103_cast_fp16)[name = tensor("input_453_cast_fp16")]; + tensor var_10536 = const()[name = tensor("op_10536"), val = tensor([1, 1])]; + tensor var_10538 = const()[name = tensor("op_10538"), val = tensor([1, 1])]; + tensor hidden_states_279_pad_type_0 = const()[name = tensor("hidden_states_279_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_279_pad_0 = const()[name = tensor("hidden_states_279_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_3_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1693265216)))]; + tensor up_blocks_3_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1698794880)))]; + tensor hidden_states_279_cast_fp16 = conv(bias = up_blocks_3_resnets_0_conv1_bias_to_fp16, dilations = var_10538, groups = var_10509, pad = hidden_states_279_pad_0, pad_type = hidden_states_279_pad_type_0, strides = var_10536, weight = up_blocks_3_resnets_0_conv1_weight_to_fp16, x = input_453_cast_fp16)[name = tensor("hidden_states_279_cast_fp16")]; + tensor var_10544 = const()[name = tensor("op_10544"), val = tensor([1, 1])]; + tensor var_10546 = const()[name = tensor("op_10546"), val = tensor([1, 1])]; + tensor temb_39_pad_type_0 = const()[name = tensor("temb_39_pad_type_0"), val = tensor("custom")]; + tensor temb_39_pad_0 = const()[name = tensor("temb_39_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1698795584)))]; + tensor up_blocks_3_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1699614848)))]; + tensor temb_39_cast_fp16 = conv(bias = up_blocks_3_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_10546, groups = var_10509, pad = temb_39_pad_0, pad_type = temb_39_pad_type_0, strides = var_10544, weight = up_blocks_3_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_39_cast_fp16")]; + tensor input_457_cast_fp16 = add(x = hidden_states_279_cast_fp16, y = temb_39_cast_fp16)[name = tensor("input_457_cast_fp16")]; + tensor reshape_208_shape_0 = const()[name = tensor("reshape_208_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_208_cast_fp16 = reshape(shape = reshape_208_shape_0, x = input_457_cast_fp16)[name = tensor("reshape_208_cast_fp16")]; + tensor reduce_mean_156_axes_0 = const()[name = tensor("reduce_mean_156_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_156_keep_dims_0 = const()[name = tensor("reduce_mean_156_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_156_cast_fp16 = reduce_mean(axes = reduce_mean_156_axes_0, keep_dims = reduce_mean_156_keep_dims_0, x = reshape_208_cast_fp16)[name = tensor("reduce_mean_156_cast_fp16")]; + tensor sub_104_cast_fp16 = sub(x = reshape_208_cast_fp16, y = reduce_mean_156_cast_fp16)[name = tensor("sub_104_cast_fp16")]; + tensor square_52_cast_fp16 = square(x = sub_104_cast_fp16)[name = tensor("square_52_cast_fp16")]; + tensor reduce_mean_158_axes_0 = const()[name = tensor("reduce_mean_158_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_158_keep_dims_0 = const()[name = tensor("reduce_mean_158_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_158_cast_fp16 = reduce_mean(axes = reduce_mean_158_axes_0, keep_dims = reduce_mean_158_keep_dims_0, x = square_52_cast_fp16)[name = tensor("reduce_mean_158_cast_fp16")]; + tensor add_104_y_0_to_fp16 = const()[name = tensor("add_104_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_104_cast_fp16 = add(x = reduce_mean_158_cast_fp16, y = add_104_y_0_to_fp16)[name = tensor("add_104_cast_fp16")]; + tensor sqrt_52_cast_fp16 = sqrt(x = add_104_cast_fp16)[name = tensor("sqrt_52_cast_fp16")]; + tensor real_div_52_cast_fp16 = real_div(x = sub_104_cast_fp16, y = sqrt_52_cast_fp16)[name = tensor("real_div_52_cast_fp16")]; + tensor reshape_209_shape_0 = const()[name = tensor("reshape_209_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_209_cast_fp16 = reshape(shape = reshape_209_shape_0, x = real_div_52_cast_fp16)[name = tensor("reshape_209_cast_fp16")]; + tensor add_105_gamma_0_to_fp16 = const()[name = tensor("add_105_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1699615552)))]; + tensor add_105_beta_0_to_fp16 = const()[name = tensor("add_105_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1699616256)))]; + tensor add_105_epsilon_0_to_fp16 = const()[name = tensor("add_105_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_105_cast_fp16 = batch_norm(beta = add_105_beta_0_to_fp16, epsilon = add_105_epsilon_0_to_fp16, gamma = add_105_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_209_cast_fp16)[name = tensor("add_105_cast_fp16")]; + tensor input_461_cast_fp16 = silu(x = add_105_cast_fp16)[name = tensor("input_461_cast_fp16")]; + tensor var_10556 = const()[name = tensor("op_10556"), val = tensor([1, 1])]; + tensor var_10558 = const()[name = tensor("op_10558"), val = tensor([1, 1])]; + tensor hidden_states_281_pad_type_0 = const()[name = tensor("hidden_states_281_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_281_pad_0 = const()[name = tensor("hidden_states_281_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_3_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1699616960)))]; + tensor up_blocks_3_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1701460224)))]; + tensor hidden_states_281_cast_fp16 = conv(bias = up_blocks_3_resnets_0_conv2_bias_to_fp16, dilations = var_10558, groups = var_10509, pad = hidden_states_281_pad_0, pad_type = hidden_states_281_pad_type_0, strides = var_10556, weight = up_blocks_3_resnets_0_conv2_weight_to_fp16, x = input_461_cast_fp16)[name = tensor("hidden_states_281_cast_fp16")]; + tensor var_10563 = const()[name = tensor("op_10563"), val = tensor([1, 1])]; + tensor var_10565 = const()[name = tensor("op_10565"), val = tensor([1, 1])]; + tensor x_23_pad_type_0 = const()[name = tensor("x_23_pad_type_0"), val = tensor("custom")]; + tensor x_23_pad_0 = const()[name = tensor("x_23_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_resnets_0_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_0_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1701460928)))]; + tensor up_blocks_3_resnets_0_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_0_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702075392)))]; + tensor x_23_cast_fp16 = conv(bias = up_blocks_3_resnets_0_conv_shortcut_bias_to_fp16, dilations = var_10565, groups = var_10509, pad = x_23_pad_0, pad_type = x_23_pad_type_0, strides = var_10563, weight = up_blocks_3_resnets_0_conv_shortcut_weight_to_fp16, x = input_449_cast_fp16)[name = tensor("x_23_cast_fp16")]; + tensor hidden_states_283_cast_fp16 = add(x = x_23_cast_fp16, y = hidden_states_281_cast_fp16)[name = tensor("hidden_states_283_cast_fp16")]; + tensor reshape_212_shape_0 = const()[name = tensor("reshape_212_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_212_cast_fp16 = reshape(shape = reshape_212_shape_0, x = hidden_states_283_cast_fp16)[name = tensor("reshape_212_cast_fp16")]; + tensor reduce_mean_159_axes_0 = const()[name = tensor("reduce_mean_159_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_159_keep_dims_0 = const()[name = tensor("reduce_mean_159_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_159_cast_fp16 = reduce_mean(axes = reduce_mean_159_axes_0, keep_dims = reduce_mean_159_keep_dims_0, x = reshape_212_cast_fp16)[name = tensor("reduce_mean_159_cast_fp16")]; + tensor sub_106_cast_fp16 = sub(x = reshape_212_cast_fp16, y = reduce_mean_159_cast_fp16)[name = tensor("sub_106_cast_fp16")]; + tensor square_53_cast_fp16 = square(x = sub_106_cast_fp16)[name = tensor("square_53_cast_fp16")]; + tensor reduce_mean_161_axes_0 = const()[name = tensor("reduce_mean_161_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_161_keep_dims_0 = const()[name = tensor("reduce_mean_161_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_161_cast_fp16 = reduce_mean(axes = reduce_mean_161_axes_0, keep_dims = reduce_mean_161_keep_dims_0, x = square_53_cast_fp16)[name = tensor("reduce_mean_161_cast_fp16")]; + tensor add_106_y_0_to_fp16 = const()[name = tensor("add_106_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_106_cast_fp16 = add(x = reduce_mean_161_cast_fp16, y = add_106_y_0_to_fp16)[name = tensor("add_106_cast_fp16")]; + tensor sqrt_53_cast_fp16 = sqrt(x = add_106_cast_fp16)[name = tensor("sqrt_53_cast_fp16")]; + tensor real_div_53_cast_fp16 = real_div(x = sub_106_cast_fp16, y = sqrt_53_cast_fp16)[name = tensor("real_div_53_cast_fp16")]; + tensor reshape_213_shape_0 = const()[name = tensor("reshape_213_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_213_cast_fp16 = reshape(shape = reshape_213_shape_0, x = real_div_53_cast_fp16)[name = tensor("reshape_213_cast_fp16")]; + tensor add_107_gamma_0_to_fp16 = const()[name = tensor("add_107_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702076096)))]; + tensor add_107_beta_0_to_fp16 = const()[name = tensor("add_107_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702076800)))]; + tensor add_107_epsilon_0_to_fp16 = const()[name = tensor("add_107_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_107_cast_fp16 = batch_norm(beta = add_107_beta_0_to_fp16, epsilon = add_107_epsilon_0_to_fp16, gamma = add_107_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_213_cast_fp16)[name = tensor("add_107_cast_fp16")]; + tensor var_10585 = const()[name = tensor("op_10585"), val = tensor([1, 1])]; + tensor var_10587 = const()[name = tensor("op_10587"), val = tensor([1, 1])]; + tensor hidden_states_285_pad_type_0 = const()[name = tensor("hidden_states_285_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_285_pad_0 = const()[name = tensor("hidden_states_285_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702077504)))]; + tensor up_blocks_3_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702282368)))]; + tensor hidden_states_285_cast_fp16 = conv(bias = up_blocks_3_attentions_0_proj_in_bias_to_fp16, dilations = var_10587, groups = var_10509, pad = hidden_states_285_pad_0, pad_type = hidden_states_285_pad_type_0, strides = var_10585, weight = up_blocks_3_attentions_0_proj_in_weight_to_fp16, x = add_107_cast_fp16)[name = tensor("hidden_states_285_cast_fp16")]; + tensor var_10592 = const()[name = tensor("op_10592"), val = tensor([2, 320, 1, 2304])]; + tensor inputs_79_cast_fp16 = reshape(shape = var_10592, x = hidden_states_285_cast_fp16)[name = tensor("inputs_79_cast_fp16")]; + tensor var_10602 = const()[name = tensor("op_10602"), val = tensor([1])]; + tensor channels_mean_79_cast_fp16 = reduce_mean(axes = var_10602, keep_dims = var_10504, x = inputs_79_cast_fp16)[name = tensor("channels_mean_79_cast_fp16")]; + tensor zero_mean_79_cast_fp16 = sub(x = inputs_79_cast_fp16, y = channels_mean_79_cast_fp16)[name = tensor("zero_mean_79_cast_fp16")]; + tensor zero_mean_sq_79_cast_fp16 = mul(x = zero_mean_79_cast_fp16, y = zero_mean_79_cast_fp16)[name = tensor("zero_mean_sq_79_cast_fp16")]; + tensor var_10606 = const()[name = tensor("op_10606"), val = tensor([1])]; + tensor var_10607_cast_fp16 = reduce_mean(axes = var_10606, keep_dims = var_10504, x = zero_mean_sq_79_cast_fp16)[name = tensor("op_10607_cast_fp16")]; + tensor var_10608_to_fp16 = const()[name = tensor("op_10608_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_10609_cast_fp16 = add(x = var_10607_cast_fp16, y = var_10608_to_fp16)[name = tensor("op_10609_cast_fp16")]; + tensor denom_79_epsilon_0_to_fp16 = const()[name = tensor("denom_79_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_79_cast_fp16 = rsqrt(epsilon = denom_79_epsilon_0_to_fp16, x = var_10609_cast_fp16)[name = tensor("denom_79_cast_fp16")]; + tensor out_79_cast_fp16 = mul(x = zero_mean_79_cast_fp16, y = denom_79_cast_fp16)[name = tensor("out_79_cast_fp16")]; + tensor var_10613_to_fp16 = const()[name = tensor("op_10613_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702283072)))]; + tensor var_10614_cast_fp16 = add(x = out_79_cast_fp16, y = var_10613_to_fp16)[name = tensor("op_10614_cast_fp16")]; + tensor var_10616_to_fp16 = const()[name = tensor("op_10616_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702283776)))]; + tensor hidden_states_287_cast_fp16 = mul(x = var_10614_cast_fp16, y = var_10616_to_fp16)[name = tensor("hidden_states_287_cast_fp16")]; + tensor var_10623 = const()[name = tensor("op_10623"), val = tensor([1, 1])]; + tensor var_10625 = const()[name = tensor("op_10625"), val = tensor([1, 1])]; + tensor q_53_pad_type_0 = const()[name = tensor("q_53_pad_type_0"), val = tensor("custom")]; + tensor q_53_pad_0 = const()[name = tensor("q_53_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702284480)))]; + tensor q_53_cast_fp16 = conv(dilations = var_10625, groups = var_10509, pad = q_53_pad_0, pad_type = q_53_pad_type_0, strides = var_10623, weight = up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_287_cast_fp16)[name = tensor("q_53_cast_fp16")]; + tensor var_10629 = const()[name = tensor("op_10629"), val = tensor([1, 1])]; + tensor var_10631 = const()[name = tensor("op_10631"), val = tensor([1, 1])]; + tensor k_105_pad_type_0 = const()[name = tensor("k_105_pad_type_0"), val = tensor("custom")]; + tensor k_105_pad_0 = const()[name = tensor("k_105_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702489344)))]; + tensor k_105_cast_fp16 = conv(dilations = var_10631, groups = var_10509, pad = k_105_pad_0, pad_type = k_105_pad_type_0, strides = var_10629, weight = up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_287_cast_fp16)[name = tensor("k_105_cast_fp16")]; + tensor var_10635 = const()[name = tensor("op_10635"), val = tensor([1, 1])]; + tensor var_10637 = const()[name = tensor("op_10637"), val = tensor([1, 1])]; + tensor v_53_pad_type_0 = const()[name = tensor("v_53_pad_type_0"), val = tensor("custom")]; + tensor v_53_pad_0 = const()[name = tensor("v_53_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702694208)))]; + tensor v_53_cast_fp16 = conv(dilations = var_10637, groups = var_10509, pad = v_53_pad_0, pad_type = v_53_pad_type_0, strides = var_10635, weight = up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_287_cast_fp16)[name = tensor("v_53_cast_fp16")]; + tensor var_10641_begin_0 = const()[name = tensor("op_10641_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10641_end_0 = const()[name = tensor("op_10641_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_10641_end_mask_0 = const()[name = tensor("op_10641_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10641_cast_fp16 = slice_by_index(begin = var_10641_begin_0, end = var_10641_end_0, end_mask = var_10641_end_mask_0, x = q_53_cast_fp16)[name = tensor("op_10641_cast_fp16")]; + tensor var_10645_begin_0 = const()[name = tensor("op_10645_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_10645_end_0 = const()[name = tensor("op_10645_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_10645_end_mask_0 = const()[name = tensor("op_10645_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10645_cast_fp16 = slice_by_index(begin = var_10645_begin_0, end = var_10645_end_0, end_mask = var_10645_end_mask_0, x = q_53_cast_fp16)[name = tensor("op_10645_cast_fp16")]; + tensor var_10649_begin_0 = const()[name = tensor("op_10649_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_10649_end_0 = const()[name = tensor("op_10649_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_10649_end_mask_0 = const()[name = tensor("op_10649_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10649_cast_fp16 = slice_by_index(begin = var_10649_begin_0, end = var_10649_end_0, end_mask = var_10649_end_mask_0, x = q_53_cast_fp16)[name = tensor("op_10649_cast_fp16")]; + tensor var_10653_begin_0 = const()[name = tensor("op_10653_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_10653_end_0 = const()[name = tensor("op_10653_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_10653_end_mask_0 = const()[name = tensor("op_10653_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10653_cast_fp16 = slice_by_index(begin = var_10653_begin_0, end = var_10653_end_0, end_mask = var_10653_end_mask_0, x = q_53_cast_fp16)[name = tensor("op_10653_cast_fp16")]; + tensor var_10657_begin_0 = const()[name = tensor("op_10657_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_10657_end_0 = const()[name = tensor("op_10657_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_10657_end_mask_0 = const()[name = tensor("op_10657_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10657_cast_fp16 = slice_by_index(begin = var_10657_begin_0, end = var_10657_end_0, end_mask = var_10657_end_mask_0, x = q_53_cast_fp16)[name = tensor("op_10657_cast_fp16")]; + tensor k_107_perm_0 = const()[name = tensor("k_107_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_10664_begin_0 = const()[name = tensor("op_10664_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10664_end_0 = const()[name = tensor("op_10664_end_0"), val = tensor([2, 2304, 1, 64])]; + tensor var_10664_end_mask_0 = const()[name = tensor("op_10664_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_5 = transpose(perm = k_107_perm_0, x = k_105_cast_fp16)[name = tensor("transpose_5")]; + tensor var_10664_cast_fp16 = slice_by_index(begin = var_10664_begin_0, end = var_10664_end_0, end_mask = var_10664_end_mask_0, x = transpose_5)[name = tensor("op_10664_cast_fp16")]; + tensor var_10668_begin_0 = const()[name = tensor("op_10668_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_10668_end_0 = const()[name = tensor("op_10668_end_0"), val = tensor([2, 2304, 1, 128])]; + tensor var_10668_end_mask_0 = const()[name = tensor("op_10668_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10668_cast_fp16 = slice_by_index(begin = var_10668_begin_0, end = var_10668_end_0, end_mask = var_10668_end_mask_0, x = transpose_5)[name = tensor("op_10668_cast_fp16")]; + tensor var_10672_begin_0 = const()[name = tensor("op_10672_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_10672_end_0 = const()[name = tensor("op_10672_end_0"), val = tensor([2, 2304, 1, 192])]; + tensor var_10672_end_mask_0 = const()[name = tensor("op_10672_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10672_cast_fp16 = slice_by_index(begin = var_10672_begin_0, end = var_10672_end_0, end_mask = var_10672_end_mask_0, x = transpose_5)[name = tensor("op_10672_cast_fp16")]; + tensor var_10676_begin_0 = const()[name = tensor("op_10676_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_10676_end_0 = const()[name = tensor("op_10676_end_0"), val = tensor([2, 2304, 1, 256])]; + tensor var_10676_end_mask_0 = const()[name = tensor("op_10676_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10676_cast_fp16 = slice_by_index(begin = var_10676_begin_0, end = var_10676_end_0, end_mask = var_10676_end_mask_0, x = transpose_5)[name = tensor("op_10676_cast_fp16")]; + tensor var_10680_begin_0 = const()[name = tensor("op_10680_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_10680_end_0 = const()[name = tensor("op_10680_end_0"), val = tensor([2, 2304, 1, 320])]; + tensor var_10680_end_mask_0 = const()[name = tensor("op_10680_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10680_cast_fp16 = slice_by_index(begin = var_10680_begin_0, end = var_10680_end_0, end_mask = var_10680_end_mask_0, x = transpose_5)[name = tensor("op_10680_cast_fp16")]; + tensor var_10682_begin_0 = const()[name = tensor("op_10682_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10682_end_0 = const()[name = tensor("op_10682_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_10682_end_mask_0 = const()[name = tensor("op_10682_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10682_cast_fp16 = slice_by_index(begin = var_10682_begin_0, end = var_10682_end_0, end_mask = var_10682_end_mask_0, x = v_53_cast_fp16)[name = tensor("op_10682_cast_fp16")]; + tensor var_10686_begin_0 = const()[name = tensor("op_10686_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_10686_end_0 = const()[name = tensor("op_10686_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_10686_end_mask_0 = const()[name = tensor("op_10686_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10686_cast_fp16 = slice_by_index(begin = var_10686_begin_0, end = var_10686_end_0, end_mask = var_10686_end_mask_0, x = v_53_cast_fp16)[name = tensor("op_10686_cast_fp16")]; + tensor var_10690_begin_0 = const()[name = tensor("op_10690_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_10690_end_0 = const()[name = tensor("op_10690_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_10690_end_mask_0 = const()[name = tensor("op_10690_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10690_cast_fp16 = slice_by_index(begin = var_10690_begin_0, end = var_10690_end_0, end_mask = var_10690_end_mask_0, x = v_53_cast_fp16)[name = tensor("op_10690_cast_fp16")]; + tensor var_10694_begin_0 = const()[name = tensor("op_10694_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_10694_end_0 = const()[name = tensor("op_10694_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_10694_end_mask_0 = const()[name = tensor("op_10694_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10694_cast_fp16 = slice_by_index(begin = var_10694_begin_0, end = var_10694_end_0, end_mask = var_10694_end_mask_0, x = v_53_cast_fp16)[name = tensor("op_10694_cast_fp16")]; + tensor var_10698_begin_0 = const()[name = tensor("op_10698_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_10698_end_0 = const()[name = tensor("op_10698_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_10698_end_mask_0 = const()[name = tensor("op_10698_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10698_cast_fp16 = slice_by_index(begin = var_10698_begin_0, end = var_10698_end_0, end_mask = var_10698_end_mask_0, x = v_53_cast_fp16)[name = tensor("op_10698_cast_fp16")]; + tensor var_10702_equation_0 = const()[name = tensor("op_10702_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10702_cast_fp16 = einsum(equation = var_10702_equation_0, values = (var_10664_cast_fp16, var_10641_cast_fp16))[name = tensor("op_10702_cast_fp16")]; + tensor var_10703_to_fp16 = const()[name = tensor("op_10703_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_721_cast_fp16 = mul(x = var_10702_cast_fp16, y = var_10703_to_fp16)[name = tensor("aw_721_cast_fp16")]; + tensor var_10706_equation_0 = const()[name = tensor("op_10706_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10706_cast_fp16 = einsum(equation = var_10706_equation_0, values = (var_10668_cast_fp16, var_10645_cast_fp16))[name = tensor("op_10706_cast_fp16")]; + tensor var_10707_to_fp16 = const()[name = tensor("op_10707_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_723_cast_fp16 = mul(x = var_10706_cast_fp16, y = var_10707_to_fp16)[name = tensor("aw_723_cast_fp16")]; + tensor var_10710_equation_0 = const()[name = tensor("op_10710_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10710_cast_fp16 = einsum(equation = var_10710_equation_0, values = (var_10672_cast_fp16, var_10649_cast_fp16))[name = tensor("op_10710_cast_fp16")]; + tensor var_10711_to_fp16 = const()[name = tensor("op_10711_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_725_cast_fp16 = mul(x = var_10710_cast_fp16, y = var_10711_to_fp16)[name = tensor("aw_725_cast_fp16")]; + tensor var_10714_equation_0 = const()[name = tensor("op_10714_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10714_cast_fp16 = einsum(equation = var_10714_equation_0, values = (var_10676_cast_fp16, var_10653_cast_fp16))[name = tensor("op_10714_cast_fp16")]; + tensor var_10715_to_fp16 = const()[name = tensor("op_10715_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_727_cast_fp16 = mul(x = var_10714_cast_fp16, y = var_10715_to_fp16)[name = tensor("aw_727_cast_fp16")]; + tensor var_10718_equation_0 = const()[name = tensor("op_10718_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10718_cast_fp16 = einsum(equation = var_10718_equation_0, values = (var_10680_cast_fp16, var_10657_cast_fp16))[name = tensor("op_10718_cast_fp16")]; + tensor var_10719_to_fp16 = const()[name = tensor("op_10719_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_729_cast_fp16 = mul(x = var_10718_cast_fp16, y = var_10719_to_fp16)[name = tensor("aw_729_cast_fp16")]; + tensor var_10721_cast_fp16 = softmax(axis = var_10509, x = aw_721_cast_fp16)[name = tensor("op_10721_cast_fp16")]; + tensor var_10722_cast_fp16 = softmax(axis = var_10509, x = aw_723_cast_fp16)[name = tensor("op_10722_cast_fp16")]; + tensor var_10723_cast_fp16 = softmax(axis = var_10509, x = aw_725_cast_fp16)[name = tensor("op_10723_cast_fp16")]; + tensor var_10724_cast_fp16 = softmax(axis = var_10509, x = aw_727_cast_fp16)[name = tensor("op_10724_cast_fp16")]; + tensor var_10725_cast_fp16 = softmax(axis = var_10509, x = aw_729_cast_fp16)[name = tensor("op_10725_cast_fp16")]; + tensor var_10727_equation_0 = const()[name = tensor("op_10727_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10727_cast_fp16 = einsum(equation = var_10727_equation_0, values = (var_10682_cast_fp16, var_10721_cast_fp16))[name = tensor("op_10727_cast_fp16")]; + tensor var_10729_equation_0 = const()[name = tensor("op_10729_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10729_cast_fp16 = einsum(equation = var_10729_equation_0, values = (var_10686_cast_fp16, var_10722_cast_fp16))[name = tensor("op_10729_cast_fp16")]; + tensor var_10731_equation_0 = const()[name = tensor("op_10731_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10731_cast_fp16 = einsum(equation = var_10731_equation_0, values = (var_10690_cast_fp16, var_10723_cast_fp16))[name = tensor("op_10731_cast_fp16")]; + tensor var_10733_equation_0 = const()[name = tensor("op_10733_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10733_cast_fp16 = einsum(equation = var_10733_equation_0, values = (var_10694_cast_fp16, var_10724_cast_fp16))[name = tensor("op_10733_cast_fp16")]; + tensor var_10735_equation_0 = const()[name = tensor("op_10735_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10735_cast_fp16 = einsum(equation = var_10735_equation_0, values = (var_10698_cast_fp16, var_10725_cast_fp16))[name = tensor("op_10735_cast_fp16")]; + tensor input_465_interleave_0 = const()[name = tensor("input_465_interleave_0"), val = tensor(false)]; + tensor input_465_cast_fp16 = concat(axis = var_10509, interleave = input_465_interleave_0, values = (var_10727_cast_fp16, var_10729_cast_fp16, var_10731_cast_fp16, var_10733_cast_fp16, var_10735_cast_fp16))[name = tensor("input_465_cast_fp16")]; + tensor var_10741 = const()[name = tensor("op_10741"), val = tensor([1, 1])]; + tensor var_10743 = const()[name = tensor("op_10743"), val = tensor([1, 1])]; + tensor var_10745_pad_type_0 = const()[name = tensor("op_10745_pad_type_0"), val = tensor("custom")]; + tensor var_10745_pad_0 = const()[name = tensor("op_10745_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1702899072)))]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1703103936)))]; + tensor var_10745_cast_fp16 = conv(bias = up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_10743, groups = var_10509, pad = var_10745_pad_0, pad_type = var_10745_pad_type_0, strides = var_10741, weight = up_blocks_3_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_465_cast_fp16)[name = tensor("op_10745_cast_fp16")]; + tensor inputs_81_cast_fp16 = add(x = var_10745_cast_fp16, y = inputs_79_cast_fp16)[name = tensor("inputs_81_cast_fp16")]; + tensor var_10749 = const()[name = tensor("op_10749"), val = tensor([1])]; + tensor channels_mean_81_cast_fp16 = reduce_mean(axes = var_10749, keep_dims = var_10504, x = inputs_81_cast_fp16)[name = tensor("channels_mean_81_cast_fp16")]; + tensor zero_mean_81_cast_fp16 = sub(x = inputs_81_cast_fp16, y = channels_mean_81_cast_fp16)[name = tensor("zero_mean_81_cast_fp16")]; + tensor zero_mean_sq_81_cast_fp16 = mul(x = zero_mean_81_cast_fp16, y = zero_mean_81_cast_fp16)[name = tensor("zero_mean_sq_81_cast_fp16")]; + tensor var_10753 = const()[name = tensor("op_10753"), val = tensor([1])]; + tensor var_10754_cast_fp16 = reduce_mean(axes = var_10753, keep_dims = var_10504, x = zero_mean_sq_81_cast_fp16)[name = tensor("op_10754_cast_fp16")]; + tensor var_10755_to_fp16 = const()[name = tensor("op_10755_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_10756_cast_fp16 = add(x = var_10754_cast_fp16, y = var_10755_to_fp16)[name = tensor("op_10756_cast_fp16")]; + tensor denom_81_epsilon_0_to_fp16 = const()[name = tensor("denom_81_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_81_cast_fp16 = rsqrt(epsilon = denom_81_epsilon_0_to_fp16, x = var_10756_cast_fp16)[name = tensor("denom_81_cast_fp16")]; + tensor out_81_cast_fp16 = mul(x = zero_mean_81_cast_fp16, y = denom_81_cast_fp16)[name = tensor("out_81_cast_fp16")]; + tensor var_10760_to_fp16 = const()[name = tensor("op_10760_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1703104640)))]; + tensor var_10761_cast_fp16 = add(x = out_81_cast_fp16, y = var_10760_to_fp16)[name = tensor("op_10761_cast_fp16")]; + tensor var_10763_to_fp16 = const()[name = tensor("op_10763_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1703105344)))]; + tensor hidden_states_289_cast_fp16 = mul(x = var_10761_cast_fp16, y = var_10763_to_fp16)[name = tensor("hidden_states_289_cast_fp16")]; + tensor var_10770 = const()[name = tensor("op_10770"), val = tensor([1, 1])]; + tensor var_10772 = const()[name = tensor("op_10772"), val = tensor([1, 1])]; + tensor q_55_pad_type_0 = const()[name = tensor("q_55_pad_type_0"), val = tensor("custom")]; + tensor q_55_pad_0 = const()[name = tensor("q_55_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1703106048)))]; + tensor q_55_cast_fp16 = conv(dilations = var_10772, groups = var_10509, pad = q_55_pad_0, pad_type = q_55_pad_type_0, strides = var_10770, weight = up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_289_cast_fp16)[name = tensor("q_55_cast_fp16")]; + tensor var_10776 = const()[name = tensor("op_10776"), val = tensor([1, 1])]; + tensor var_10778 = const()[name = tensor("op_10778"), val = tensor([1, 1])]; + tensor k_109_pad_type_0 = const()[name = tensor("k_109_pad_type_0"), val = tensor("custom")]; + tensor k_109_pad_0 = const()[name = tensor("k_109_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1703310912)))]; + tensor k_109_cast_fp16 = conv(dilations = var_10778, groups = var_10509, pad = k_109_pad_0, pad_type = k_109_pad_type_0, strides = var_10776, weight = up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_109_cast_fp16")]; + tensor var_10782 = const()[name = tensor("op_10782"), val = tensor([1, 1])]; + tensor var_10784 = const()[name = tensor("op_10784"), val = tensor([1, 1])]; + tensor v_55_pad_type_0 = const()[name = tensor("v_55_pad_type_0"), val = tensor("custom")]; + tensor v_55_pad_0 = const()[name = tensor("v_55_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1703966336)))]; + tensor v_55_cast_fp16 = conv(dilations = var_10784, groups = var_10509, pad = v_55_pad_0, pad_type = v_55_pad_type_0, strides = var_10782, weight = up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_55_cast_fp16")]; + tensor var_10788_begin_0 = const()[name = tensor("op_10788_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10788_end_0 = const()[name = tensor("op_10788_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_10788_end_mask_0 = const()[name = tensor("op_10788_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10788_cast_fp16 = slice_by_index(begin = var_10788_begin_0, end = var_10788_end_0, end_mask = var_10788_end_mask_0, x = q_55_cast_fp16)[name = tensor("op_10788_cast_fp16")]; + tensor var_10792_begin_0 = const()[name = tensor("op_10792_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_10792_end_0 = const()[name = tensor("op_10792_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_10792_end_mask_0 = const()[name = tensor("op_10792_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10792_cast_fp16 = slice_by_index(begin = var_10792_begin_0, end = var_10792_end_0, end_mask = var_10792_end_mask_0, x = q_55_cast_fp16)[name = tensor("op_10792_cast_fp16")]; + tensor var_10796_begin_0 = const()[name = tensor("op_10796_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_10796_end_0 = const()[name = tensor("op_10796_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_10796_end_mask_0 = const()[name = tensor("op_10796_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10796_cast_fp16 = slice_by_index(begin = var_10796_begin_0, end = var_10796_end_0, end_mask = var_10796_end_mask_0, x = q_55_cast_fp16)[name = tensor("op_10796_cast_fp16")]; + tensor var_10800_begin_0 = const()[name = tensor("op_10800_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_10800_end_0 = const()[name = tensor("op_10800_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_10800_end_mask_0 = const()[name = tensor("op_10800_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10800_cast_fp16 = slice_by_index(begin = var_10800_begin_0, end = var_10800_end_0, end_mask = var_10800_end_mask_0, x = q_55_cast_fp16)[name = tensor("op_10800_cast_fp16")]; + tensor var_10804_begin_0 = const()[name = tensor("op_10804_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_10804_end_0 = const()[name = tensor("op_10804_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_10804_end_mask_0 = const()[name = tensor("op_10804_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10804_cast_fp16 = slice_by_index(begin = var_10804_begin_0, end = var_10804_end_0, end_mask = var_10804_end_mask_0, x = q_55_cast_fp16)[name = tensor("op_10804_cast_fp16")]; + tensor k_111_perm_0 = const()[name = tensor("k_111_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_10811_begin_0 = const()[name = tensor("op_10811_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10811_end_0 = const()[name = tensor("op_10811_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_10811_end_mask_0 = const()[name = tensor("op_10811_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_4 = transpose(perm = k_111_perm_0, x = k_109_cast_fp16)[name = tensor("transpose_4")]; + tensor var_10811_cast_fp16 = slice_by_index(begin = var_10811_begin_0, end = var_10811_end_0, end_mask = var_10811_end_mask_0, x = transpose_4)[name = tensor("op_10811_cast_fp16")]; + tensor var_10815_begin_0 = const()[name = tensor("op_10815_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_10815_end_0 = const()[name = tensor("op_10815_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_10815_end_mask_0 = const()[name = tensor("op_10815_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10815_cast_fp16 = slice_by_index(begin = var_10815_begin_0, end = var_10815_end_0, end_mask = var_10815_end_mask_0, x = transpose_4)[name = tensor("op_10815_cast_fp16")]; + tensor var_10819_begin_0 = const()[name = tensor("op_10819_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_10819_end_0 = const()[name = tensor("op_10819_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_10819_end_mask_0 = const()[name = tensor("op_10819_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10819_cast_fp16 = slice_by_index(begin = var_10819_begin_0, end = var_10819_end_0, end_mask = var_10819_end_mask_0, x = transpose_4)[name = tensor("op_10819_cast_fp16")]; + tensor var_10823_begin_0 = const()[name = tensor("op_10823_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_10823_end_0 = const()[name = tensor("op_10823_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_10823_end_mask_0 = const()[name = tensor("op_10823_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10823_cast_fp16 = slice_by_index(begin = var_10823_begin_0, end = var_10823_end_0, end_mask = var_10823_end_mask_0, x = transpose_4)[name = tensor("op_10823_cast_fp16")]; + tensor var_10827_begin_0 = const()[name = tensor("op_10827_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_10827_end_0 = const()[name = tensor("op_10827_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_10827_end_mask_0 = const()[name = tensor("op_10827_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_10827_cast_fp16 = slice_by_index(begin = var_10827_begin_0, end = var_10827_end_0, end_mask = var_10827_end_mask_0, x = transpose_4)[name = tensor("op_10827_cast_fp16")]; + tensor var_10829_begin_0 = const()[name = tensor("op_10829_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_10829_end_0 = const()[name = tensor("op_10829_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_10829_end_mask_0 = const()[name = tensor("op_10829_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10829_cast_fp16 = slice_by_index(begin = var_10829_begin_0, end = var_10829_end_0, end_mask = var_10829_end_mask_0, x = v_55_cast_fp16)[name = tensor("op_10829_cast_fp16")]; + tensor var_10833_begin_0 = const()[name = tensor("op_10833_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_10833_end_0 = const()[name = tensor("op_10833_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_10833_end_mask_0 = const()[name = tensor("op_10833_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10833_cast_fp16 = slice_by_index(begin = var_10833_begin_0, end = var_10833_end_0, end_mask = var_10833_end_mask_0, x = v_55_cast_fp16)[name = tensor("op_10833_cast_fp16")]; + tensor var_10837_begin_0 = const()[name = tensor("op_10837_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_10837_end_0 = const()[name = tensor("op_10837_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_10837_end_mask_0 = const()[name = tensor("op_10837_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10837_cast_fp16 = slice_by_index(begin = var_10837_begin_0, end = var_10837_end_0, end_mask = var_10837_end_mask_0, x = v_55_cast_fp16)[name = tensor("op_10837_cast_fp16")]; + tensor var_10841_begin_0 = const()[name = tensor("op_10841_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_10841_end_0 = const()[name = tensor("op_10841_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_10841_end_mask_0 = const()[name = tensor("op_10841_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10841_cast_fp16 = slice_by_index(begin = var_10841_begin_0, end = var_10841_end_0, end_mask = var_10841_end_mask_0, x = v_55_cast_fp16)[name = tensor("op_10841_cast_fp16")]; + tensor var_10845_begin_0 = const()[name = tensor("op_10845_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_10845_end_0 = const()[name = tensor("op_10845_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_10845_end_mask_0 = const()[name = tensor("op_10845_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_10845_cast_fp16 = slice_by_index(begin = var_10845_begin_0, end = var_10845_end_0, end_mask = var_10845_end_mask_0, x = v_55_cast_fp16)[name = tensor("op_10845_cast_fp16")]; + tensor var_10849_equation_0 = const()[name = tensor("op_10849_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10849_cast_fp16 = einsum(equation = var_10849_equation_0, values = (var_10811_cast_fp16, var_10788_cast_fp16))[name = tensor("op_10849_cast_fp16")]; + tensor var_10850_to_fp16 = const()[name = tensor("op_10850_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_731_cast_fp16 = mul(x = var_10849_cast_fp16, y = var_10850_to_fp16)[name = tensor("aw_731_cast_fp16")]; + tensor var_10853_equation_0 = const()[name = tensor("op_10853_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10853_cast_fp16 = einsum(equation = var_10853_equation_0, values = (var_10815_cast_fp16, var_10792_cast_fp16))[name = tensor("op_10853_cast_fp16")]; + tensor var_10854_to_fp16 = const()[name = tensor("op_10854_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_733_cast_fp16 = mul(x = var_10853_cast_fp16, y = var_10854_to_fp16)[name = tensor("aw_733_cast_fp16")]; + tensor var_10857_equation_0 = const()[name = tensor("op_10857_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10857_cast_fp16 = einsum(equation = var_10857_equation_0, values = (var_10819_cast_fp16, var_10796_cast_fp16))[name = tensor("op_10857_cast_fp16")]; + tensor var_10858_to_fp16 = const()[name = tensor("op_10858_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_735_cast_fp16 = mul(x = var_10857_cast_fp16, y = var_10858_to_fp16)[name = tensor("aw_735_cast_fp16")]; + tensor var_10861_equation_0 = const()[name = tensor("op_10861_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10861_cast_fp16 = einsum(equation = var_10861_equation_0, values = (var_10823_cast_fp16, var_10800_cast_fp16))[name = tensor("op_10861_cast_fp16")]; + tensor var_10862_to_fp16 = const()[name = tensor("op_10862_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_737_cast_fp16 = mul(x = var_10861_cast_fp16, y = var_10862_to_fp16)[name = tensor("aw_737_cast_fp16")]; + tensor var_10865_equation_0 = const()[name = tensor("op_10865_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_10865_cast_fp16 = einsum(equation = var_10865_equation_0, values = (var_10827_cast_fp16, var_10804_cast_fp16))[name = tensor("op_10865_cast_fp16")]; + tensor var_10866_to_fp16 = const()[name = tensor("op_10866_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_739_cast_fp16 = mul(x = var_10865_cast_fp16, y = var_10866_to_fp16)[name = tensor("aw_739_cast_fp16")]; + tensor var_10868_cast_fp16 = softmax(axis = var_10509, x = aw_731_cast_fp16)[name = tensor("op_10868_cast_fp16")]; + tensor var_10869_cast_fp16 = softmax(axis = var_10509, x = aw_733_cast_fp16)[name = tensor("op_10869_cast_fp16")]; + tensor var_10870_cast_fp16 = softmax(axis = var_10509, x = aw_735_cast_fp16)[name = tensor("op_10870_cast_fp16")]; + tensor var_10871_cast_fp16 = softmax(axis = var_10509, x = aw_737_cast_fp16)[name = tensor("op_10871_cast_fp16")]; + tensor var_10872_cast_fp16 = softmax(axis = var_10509, x = aw_739_cast_fp16)[name = tensor("op_10872_cast_fp16")]; + tensor var_10874_equation_0 = const()[name = tensor("op_10874_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10874_cast_fp16 = einsum(equation = var_10874_equation_0, values = (var_10829_cast_fp16, var_10868_cast_fp16))[name = tensor("op_10874_cast_fp16")]; + tensor var_10876_equation_0 = const()[name = tensor("op_10876_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10876_cast_fp16 = einsum(equation = var_10876_equation_0, values = (var_10833_cast_fp16, var_10869_cast_fp16))[name = tensor("op_10876_cast_fp16")]; + tensor var_10878_equation_0 = const()[name = tensor("op_10878_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10878_cast_fp16 = einsum(equation = var_10878_equation_0, values = (var_10837_cast_fp16, var_10870_cast_fp16))[name = tensor("op_10878_cast_fp16")]; + tensor var_10880_equation_0 = const()[name = tensor("op_10880_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10880_cast_fp16 = einsum(equation = var_10880_equation_0, values = (var_10841_cast_fp16, var_10871_cast_fp16))[name = tensor("op_10880_cast_fp16")]; + tensor var_10882_equation_0 = const()[name = tensor("op_10882_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_10882_cast_fp16 = einsum(equation = var_10882_equation_0, values = (var_10845_cast_fp16, var_10872_cast_fp16))[name = tensor("op_10882_cast_fp16")]; + tensor input_467_interleave_0 = const()[name = tensor("input_467_interleave_0"), val = tensor(false)]; + tensor input_467_cast_fp16 = concat(axis = var_10509, interleave = input_467_interleave_0, values = (var_10874_cast_fp16, var_10876_cast_fp16, var_10878_cast_fp16, var_10880_cast_fp16, var_10882_cast_fp16))[name = tensor("input_467_cast_fp16")]; + tensor var_10888 = const()[name = tensor("op_10888"), val = tensor([1, 1])]; + tensor var_10890 = const()[name = tensor("op_10890"), val = tensor([1, 1])]; + tensor var_10892_pad_type_0 = const()[name = tensor("op_10892_pad_type_0"), val = tensor("custom")]; + tensor var_10892_pad_0 = const()[name = tensor("op_10892_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1704621760)))]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1704826624)))]; + tensor var_10892_cast_fp16 = conv(bias = up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_10890, groups = var_10509, pad = var_10892_pad_0, pad_type = var_10892_pad_type_0, strides = var_10888, weight = up_blocks_3_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_467_cast_fp16)[name = tensor("op_10892_cast_fp16")]; + tensor inputs_83_cast_fp16 = add(x = var_10892_cast_fp16, y = inputs_81_cast_fp16)[name = tensor("inputs_83_cast_fp16")]; + tensor var_10896 = const()[name = tensor("op_10896"), val = tensor([1])]; + tensor channels_mean_83_cast_fp16 = reduce_mean(axes = var_10896, keep_dims = var_10504, x = inputs_83_cast_fp16)[name = tensor("channels_mean_83_cast_fp16")]; + tensor zero_mean_83_cast_fp16 = sub(x = inputs_83_cast_fp16, y = channels_mean_83_cast_fp16)[name = tensor("zero_mean_83_cast_fp16")]; + tensor zero_mean_sq_83_cast_fp16 = mul(x = zero_mean_83_cast_fp16, y = zero_mean_83_cast_fp16)[name = tensor("zero_mean_sq_83_cast_fp16")]; + tensor var_10900 = const()[name = tensor("op_10900"), val = tensor([1])]; + tensor var_10901_cast_fp16 = reduce_mean(axes = var_10900, keep_dims = var_10504, x = zero_mean_sq_83_cast_fp16)[name = tensor("op_10901_cast_fp16")]; + tensor var_10902_to_fp16 = const()[name = tensor("op_10902_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_10903_cast_fp16 = add(x = var_10901_cast_fp16, y = var_10902_to_fp16)[name = tensor("op_10903_cast_fp16")]; + tensor denom_83_epsilon_0_to_fp16 = const()[name = tensor("denom_83_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_83_cast_fp16 = rsqrt(epsilon = denom_83_epsilon_0_to_fp16, x = var_10903_cast_fp16)[name = tensor("denom_83_cast_fp16")]; + tensor out_83_cast_fp16 = mul(x = zero_mean_83_cast_fp16, y = denom_83_cast_fp16)[name = tensor("out_83_cast_fp16")]; + tensor var_10907_to_fp16 = const()[name = tensor("op_10907_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1704827328)))]; + tensor var_10908_cast_fp16 = add(x = out_83_cast_fp16, y = var_10907_to_fp16)[name = tensor("op_10908_cast_fp16")]; + tensor var_10910_to_fp16 = const()[name = tensor("op_10910_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1704828032)))]; + tensor input_469_cast_fp16 = mul(x = var_10908_cast_fp16, y = var_10910_to_fp16)[name = tensor("input_469_cast_fp16")]; + tensor var_10918 = const()[name = tensor("op_10918"), val = tensor([1, 1])]; + tensor var_10920 = const()[name = tensor("op_10920"), val = tensor([1, 1])]; + tensor var_10922_pad_type_0 = const()[name = tensor("op_10922_pad_type_0"), val = tensor("custom")]; + tensor var_10922_pad_0 = const()[name = tensor("op_10922_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1704828736)))]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1706467200)))]; + tensor var_10922_cast_fp16 = conv(bias = up_blocks_3_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_10920, groups = var_10509, pad = var_10922_pad_0, pad_type = var_10922_pad_type_0, strides = var_10918, weight = up_blocks_3_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_469_cast_fp16)[name = tensor("op_10922_cast_fp16")]; + tensor var_10923_split_sizes_0 = const()[name = tensor("op_10923_split_sizes_0"), val = tensor([1280, 1280])]; + tensor var_10923_axis_0 = const()[name = tensor("op_10923_axis_0"), val = tensor(1)]; + tensor var_10923_cast_fp16_0, tensor var_10923_cast_fp16_1 = split(axis = var_10923_axis_0, split_sizes = var_10923_split_sizes_0, x = var_10922_cast_fp16)[name = tensor("op_10923_cast_fp16")]; + tensor var_10925_mode_0 = const()[name = tensor("op_10925_mode_0"), val = tensor("EXACT")]; + tensor var_10925_cast_fp16 = gelu(mode = var_10925_mode_0, x = var_10923_cast_fp16_1)[name = tensor("op_10925_cast_fp16")]; + tensor input_471_cast_fp16 = mul(x = var_10923_cast_fp16_0, y = var_10925_cast_fp16)[name = tensor("input_471_cast_fp16")]; + tensor var_10929 = const()[name = tensor("op_10929"), val = tensor([1, 1])]; + tensor var_10931 = const()[name = tensor("op_10931"), val = tensor([1, 1])]; + tensor var_10933_pad_type_0 = const()[name = tensor("op_10933_pad_type_0"), val = tensor("custom")]; + tensor var_10933_pad_0 = const()[name = tensor("op_10933_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1706472384)))]; + tensor up_blocks_3_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1707291648)))]; + tensor var_10933_cast_fp16 = conv(bias = up_blocks_3_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_10931, groups = var_10509, pad = var_10933_pad_0, pad_type = var_10933_pad_type_0, strides = var_10929, weight = up_blocks_3_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_471_cast_fp16)[name = tensor("op_10933_cast_fp16")]; + tensor hidden_states_293_cast_fp16 = add(x = var_10933_cast_fp16, y = inputs_83_cast_fp16)[name = tensor("hidden_states_293_cast_fp16")]; + tensor var_10935 = const()[name = tensor("op_10935"), val = tensor([2, 320, 48, 48])]; + tensor input_473_cast_fp16 = reshape(shape = var_10935, x = hidden_states_293_cast_fp16)[name = tensor("input_473_cast_fp16")]; + tensor var_10939 = const()[name = tensor("op_10939"), val = tensor([1, 1])]; + tensor var_10941 = const()[name = tensor("op_10941"), val = tensor([1, 1])]; + tensor hidden_states_295_pad_type_0 = const()[name = tensor("hidden_states_295_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_295_pad_0 = const()[name = tensor("hidden_states_295_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1707292352)))]; + tensor up_blocks_3_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1707497216)))]; + tensor hidden_states_295_cast_fp16 = conv(bias = up_blocks_3_attentions_0_proj_out_bias_to_fp16, dilations = var_10941, groups = var_10509, pad = hidden_states_295_pad_0, pad_type = hidden_states_295_pad_type_0, strides = var_10939, weight = up_blocks_3_attentions_0_proj_out_weight_to_fp16, x = input_473_cast_fp16)[name = tensor("hidden_states_295_cast_fp16")]; + tensor hidden_states_297_cast_fp16 = add(x = hidden_states_295_cast_fp16, y = hidden_states_283_cast_fp16)[name = tensor("hidden_states_297_cast_fp16")]; + tensor input_475_interleave_0 = const()[name = tensor("input_475_interleave_0"), val = tensor(false)]; + tensor input_475_cast_fp16 = concat(axis = var_10509, interleave = input_475_interleave_0, values = (hidden_states_297_cast_fp16, input_35_cast_fp16))[name = tensor("input_475_cast_fp16")]; + tensor reshape_216_shape_0 = const()[name = tensor("reshape_216_shape_0"), val = tensor([2, 32, 20, 48, 48])]; + tensor reshape_216_cast_fp16 = reshape(shape = reshape_216_shape_0, x = input_475_cast_fp16)[name = tensor("reshape_216_cast_fp16")]; + tensor reduce_mean_162_axes_0 = const()[name = tensor("reduce_mean_162_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_162_keep_dims_0 = const()[name = tensor("reduce_mean_162_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_162_cast_fp16 = reduce_mean(axes = reduce_mean_162_axes_0, keep_dims = reduce_mean_162_keep_dims_0, x = reshape_216_cast_fp16)[name = tensor("reduce_mean_162_cast_fp16")]; + tensor sub_108_cast_fp16 = sub(x = reshape_216_cast_fp16, y = reduce_mean_162_cast_fp16)[name = tensor("sub_108_cast_fp16")]; + tensor square_54_cast_fp16 = square(x = sub_108_cast_fp16)[name = tensor("square_54_cast_fp16")]; + tensor reduce_mean_164_axes_0 = const()[name = tensor("reduce_mean_164_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_164_keep_dims_0 = const()[name = tensor("reduce_mean_164_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_164_cast_fp16 = reduce_mean(axes = reduce_mean_164_axes_0, keep_dims = reduce_mean_164_keep_dims_0, x = square_54_cast_fp16)[name = tensor("reduce_mean_164_cast_fp16")]; + tensor add_108_y_0_to_fp16 = const()[name = tensor("add_108_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_108_cast_fp16 = add(x = reduce_mean_164_cast_fp16, y = add_108_y_0_to_fp16)[name = tensor("add_108_cast_fp16")]; + tensor sqrt_54_cast_fp16 = sqrt(x = add_108_cast_fp16)[name = tensor("sqrt_54_cast_fp16")]; + tensor real_div_54_cast_fp16 = real_div(x = sub_108_cast_fp16, y = sqrt_54_cast_fp16)[name = tensor("real_div_54_cast_fp16")]; + tensor reshape_217_shape_0 = const()[name = tensor("reshape_217_shape_0"), val = tensor([2, 640, 48, 48])]; + tensor reshape_217_cast_fp16 = reshape(shape = reshape_217_shape_0, x = real_div_54_cast_fp16)[name = tensor("reshape_217_cast_fp16")]; + tensor add_109_gamma_0_to_fp16 = const()[name = tensor("add_109_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1707497920)))]; + tensor add_109_beta_0_to_fp16 = const()[name = tensor("add_109_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1707499264)))]; + tensor add_109_epsilon_0_to_fp16 = const()[name = tensor("add_109_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_109_cast_fp16 = batch_norm(beta = add_109_beta_0_to_fp16, epsilon = add_109_epsilon_0_to_fp16, gamma = add_109_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_217_cast_fp16)[name = tensor("add_109_cast_fp16")]; + tensor input_479_cast_fp16 = silu(x = add_109_cast_fp16)[name = tensor("input_479_cast_fp16")]; + tensor var_10959 = const()[name = tensor("op_10959"), val = tensor([1, 1])]; + tensor var_10961 = const()[name = tensor("op_10961"), val = tensor([1, 1])]; + tensor hidden_states_299_pad_type_0 = const()[name = tensor("hidden_states_299_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_299_pad_0 = const()[name = tensor("hidden_states_299_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_3_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1707500608)))]; + tensor up_blocks_3_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1711187072)))]; + tensor hidden_states_299_cast_fp16 = conv(bias = up_blocks_3_resnets_1_conv1_bias_to_fp16, dilations = var_10961, groups = var_10509, pad = hidden_states_299_pad_0, pad_type = hidden_states_299_pad_type_0, strides = var_10959, weight = up_blocks_3_resnets_1_conv1_weight_to_fp16, x = input_479_cast_fp16)[name = tensor("hidden_states_299_cast_fp16")]; + tensor var_10967 = const()[name = tensor("op_10967"), val = tensor([1, 1])]; + tensor var_10969 = const()[name = tensor("op_10969"), val = tensor([1, 1])]; + tensor temb_41_pad_type_0 = const()[name = tensor("temb_41_pad_type_0"), val = tensor("custom")]; + tensor temb_41_pad_0 = const()[name = tensor("temb_41_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1711187776)))]; + tensor up_blocks_3_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1712007040)))]; + tensor temb_41_cast_fp16 = conv(bias = up_blocks_3_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_10969, groups = var_10509, pad = temb_41_pad_0, pad_type = temb_41_pad_type_0, strides = var_10967, weight = up_blocks_3_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_41_cast_fp16")]; + tensor input_483_cast_fp16 = add(x = hidden_states_299_cast_fp16, y = temb_41_cast_fp16)[name = tensor("input_483_cast_fp16")]; + tensor reshape_220_shape_0 = const()[name = tensor("reshape_220_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_220_cast_fp16 = reshape(shape = reshape_220_shape_0, x = input_483_cast_fp16)[name = tensor("reshape_220_cast_fp16")]; + tensor reduce_mean_165_axes_0 = const()[name = tensor("reduce_mean_165_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_165_keep_dims_0 = const()[name = tensor("reduce_mean_165_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_165_cast_fp16 = reduce_mean(axes = reduce_mean_165_axes_0, keep_dims = reduce_mean_165_keep_dims_0, x = reshape_220_cast_fp16)[name = tensor("reduce_mean_165_cast_fp16")]; + tensor sub_110_cast_fp16 = sub(x = reshape_220_cast_fp16, y = reduce_mean_165_cast_fp16)[name = tensor("sub_110_cast_fp16")]; + tensor square_55_cast_fp16 = square(x = sub_110_cast_fp16)[name = tensor("square_55_cast_fp16")]; + tensor reduce_mean_167_axes_0 = const()[name = tensor("reduce_mean_167_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_167_keep_dims_0 = const()[name = tensor("reduce_mean_167_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_167_cast_fp16 = reduce_mean(axes = reduce_mean_167_axes_0, keep_dims = reduce_mean_167_keep_dims_0, x = square_55_cast_fp16)[name = tensor("reduce_mean_167_cast_fp16")]; + tensor add_110_y_0_to_fp16 = const()[name = tensor("add_110_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_110_cast_fp16 = add(x = reduce_mean_167_cast_fp16, y = add_110_y_0_to_fp16)[name = tensor("add_110_cast_fp16")]; + tensor sqrt_55_cast_fp16 = sqrt(x = add_110_cast_fp16)[name = tensor("sqrt_55_cast_fp16")]; + tensor real_div_55_cast_fp16 = real_div(x = sub_110_cast_fp16, y = sqrt_55_cast_fp16)[name = tensor("real_div_55_cast_fp16")]; + tensor reshape_221_shape_0 = const()[name = tensor("reshape_221_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_221_cast_fp16 = reshape(shape = reshape_221_shape_0, x = real_div_55_cast_fp16)[name = tensor("reshape_221_cast_fp16")]; + tensor add_111_gamma_0_to_fp16 = const()[name = tensor("add_111_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1712007744)))]; + tensor add_111_beta_0_to_fp16 = const()[name = tensor("add_111_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1712008448)))]; + tensor add_111_epsilon_0_to_fp16 = const()[name = tensor("add_111_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_111_cast_fp16 = batch_norm(beta = add_111_beta_0_to_fp16, epsilon = add_111_epsilon_0_to_fp16, gamma = add_111_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_221_cast_fp16)[name = tensor("add_111_cast_fp16")]; + tensor input_487_cast_fp16 = silu(x = add_111_cast_fp16)[name = tensor("input_487_cast_fp16")]; + tensor var_10979 = const()[name = tensor("op_10979"), val = tensor([1, 1])]; + tensor var_10981 = const()[name = tensor("op_10981"), val = tensor([1, 1])]; + tensor hidden_states_301_pad_type_0 = const()[name = tensor("hidden_states_301_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_301_pad_0 = const()[name = tensor("hidden_states_301_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_3_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1712009152)))]; + tensor up_blocks_3_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1713852416)))]; + tensor hidden_states_301_cast_fp16 = conv(bias = up_blocks_3_resnets_1_conv2_bias_to_fp16, dilations = var_10981, groups = var_10509, pad = hidden_states_301_pad_0, pad_type = hidden_states_301_pad_type_0, strides = var_10979, weight = up_blocks_3_resnets_1_conv2_weight_to_fp16, x = input_487_cast_fp16)[name = tensor("hidden_states_301_cast_fp16")]; + tensor var_10986 = const()[name = tensor("op_10986"), val = tensor([1, 1])]; + tensor var_10988 = const()[name = tensor("op_10988"), val = tensor([1, 1])]; + tensor x_25_pad_type_0 = const()[name = tensor("x_25_pad_type_0"), val = tensor("custom")]; + tensor x_25_pad_0 = const()[name = tensor("x_25_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_resnets_1_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_1_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1713853120)))]; + tensor up_blocks_3_resnets_1_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_1_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714262784)))]; + tensor x_25_cast_fp16 = conv(bias = up_blocks_3_resnets_1_conv_shortcut_bias_to_fp16, dilations = var_10988, groups = var_10509, pad = x_25_pad_0, pad_type = x_25_pad_type_0, strides = var_10986, weight = up_blocks_3_resnets_1_conv_shortcut_weight_to_fp16, x = input_475_cast_fp16)[name = tensor("x_25_cast_fp16")]; + tensor hidden_states_303_cast_fp16 = add(x = x_25_cast_fp16, y = hidden_states_301_cast_fp16)[name = tensor("hidden_states_303_cast_fp16")]; + tensor reshape_224_shape_0 = const()[name = tensor("reshape_224_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_224_cast_fp16 = reshape(shape = reshape_224_shape_0, x = hidden_states_303_cast_fp16)[name = tensor("reshape_224_cast_fp16")]; + tensor reduce_mean_168_axes_0 = const()[name = tensor("reduce_mean_168_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_168_keep_dims_0 = const()[name = tensor("reduce_mean_168_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_168_cast_fp16 = reduce_mean(axes = reduce_mean_168_axes_0, keep_dims = reduce_mean_168_keep_dims_0, x = reshape_224_cast_fp16)[name = tensor("reduce_mean_168_cast_fp16")]; + tensor sub_112_cast_fp16 = sub(x = reshape_224_cast_fp16, y = reduce_mean_168_cast_fp16)[name = tensor("sub_112_cast_fp16")]; + tensor square_56_cast_fp16 = square(x = sub_112_cast_fp16)[name = tensor("square_56_cast_fp16")]; + tensor reduce_mean_170_axes_0 = const()[name = tensor("reduce_mean_170_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_170_keep_dims_0 = const()[name = tensor("reduce_mean_170_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_170_cast_fp16 = reduce_mean(axes = reduce_mean_170_axes_0, keep_dims = reduce_mean_170_keep_dims_0, x = square_56_cast_fp16)[name = tensor("reduce_mean_170_cast_fp16")]; + tensor add_112_y_0_to_fp16 = const()[name = tensor("add_112_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_112_cast_fp16 = add(x = reduce_mean_170_cast_fp16, y = add_112_y_0_to_fp16)[name = tensor("add_112_cast_fp16")]; + tensor sqrt_56_cast_fp16 = sqrt(x = add_112_cast_fp16)[name = tensor("sqrt_56_cast_fp16")]; + tensor real_div_56_cast_fp16 = real_div(x = sub_112_cast_fp16, y = sqrt_56_cast_fp16)[name = tensor("real_div_56_cast_fp16")]; + tensor reshape_225_shape_0 = const()[name = tensor("reshape_225_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_225_cast_fp16 = reshape(shape = reshape_225_shape_0, x = real_div_56_cast_fp16)[name = tensor("reshape_225_cast_fp16")]; + tensor add_113_gamma_0_to_fp16 = const()[name = tensor("add_113_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714263488)))]; + tensor add_113_beta_0_to_fp16 = const()[name = tensor("add_113_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714264192)))]; + tensor add_113_epsilon_0_to_fp16 = const()[name = tensor("add_113_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_113_cast_fp16 = batch_norm(beta = add_113_beta_0_to_fp16, epsilon = add_113_epsilon_0_to_fp16, gamma = add_113_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_225_cast_fp16)[name = tensor("add_113_cast_fp16")]; + tensor var_11008 = const()[name = tensor("op_11008"), val = tensor([1, 1])]; + tensor var_11010 = const()[name = tensor("op_11010"), val = tensor([1, 1])]; + tensor hidden_states_305_pad_type_0 = const()[name = tensor("hidden_states_305_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_305_pad_0 = const()[name = tensor("hidden_states_305_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_proj_in_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714264896)))]; + tensor up_blocks_3_attentions_1_proj_in_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714469760)))]; + tensor hidden_states_305_cast_fp16 = conv(bias = up_blocks_3_attentions_1_proj_in_bias_to_fp16, dilations = var_11010, groups = var_10509, pad = hidden_states_305_pad_0, pad_type = hidden_states_305_pad_type_0, strides = var_11008, weight = up_blocks_3_attentions_1_proj_in_weight_to_fp16, x = add_113_cast_fp16)[name = tensor("hidden_states_305_cast_fp16")]; + tensor var_11015 = const()[name = tensor("op_11015"), val = tensor([2, 320, 1, 2304])]; + tensor inputs_85_cast_fp16 = reshape(shape = var_11015, x = hidden_states_305_cast_fp16)[name = tensor("inputs_85_cast_fp16")]; + tensor var_11025 = const()[name = tensor("op_11025"), val = tensor([1])]; + tensor channels_mean_85_cast_fp16 = reduce_mean(axes = var_11025, keep_dims = var_10504, x = inputs_85_cast_fp16)[name = tensor("channels_mean_85_cast_fp16")]; + tensor zero_mean_85_cast_fp16 = sub(x = inputs_85_cast_fp16, y = channels_mean_85_cast_fp16)[name = tensor("zero_mean_85_cast_fp16")]; + tensor zero_mean_sq_85_cast_fp16 = mul(x = zero_mean_85_cast_fp16, y = zero_mean_85_cast_fp16)[name = tensor("zero_mean_sq_85_cast_fp16")]; + tensor var_11029 = const()[name = tensor("op_11029"), val = tensor([1])]; + tensor var_11030_cast_fp16 = reduce_mean(axes = var_11029, keep_dims = var_10504, x = zero_mean_sq_85_cast_fp16)[name = tensor("op_11030_cast_fp16")]; + tensor var_11031_to_fp16 = const()[name = tensor("op_11031_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_11032_cast_fp16 = add(x = var_11030_cast_fp16, y = var_11031_to_fp16)[name = tensor("op_11032_cast_fp16")]; + tensor denom_85_epsilon_0_to_fp16 = const()[name = tensor("denom_85_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_85_cast_fp16 = rsqrt(epsilon = denom_85_epsilon_0_to_fp16, x = var_11032_cast_fp16)[name = tensor("denom_85_cast_fp16")]; + tensor out_85_cast_fp16 = mul(x = zero_mean_85_cast_fp16, y = denom_85_cast_fp16)[name = tensor("out_85_cast_fp16")]; + tensor var_11036_to_fp16 = const()[name = tensor("op_11036_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714470464)))]; + tensor var_11037_cast_fp16 = add(x = out_85_cast_fp16, y = var_11036_to_fp16)[name = tensor("op_11037_cast_fp16")]; + tensor var_11039_to_fp16 = const()[name = tensor("op_11039_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714471168)))]; + tensor hidden_states_307_cast_fp16 = mul(x = var_11037_cast_fp16, y = var_11039_to_fp16)[name = tensor("hidden_states_307_cast_fp16")]; + tensor var_11046 = const()[name = tensor("op_11046"), val = tensor([1, 1])]; + tensor var_11048 = const()[name = tensor("op_11048"), val = tensor([1, 1])]; + tensor q_57_pad_type_0 = const()[name = tensor("q_57_pad_type_0"), val = tensor("custom")]; + tensor q_57_pad_0 = const()[name = tensor("q_57_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714471872)))]; + tensor q_57_cast_fp16 = conv(dilations = var_11048, groups = var_10509, pad = q_57_pad_0, pad_type = q_57_pad_type_0, strides = var_11046, weight = up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_307_cast_fp16)[name = tensor("q_57_cast_fp16")]; + tensor var_11052 = const()[name = tensor("op_11052"), val = tensor([1, 1])]; + tensor var_11054 = const()[name = tensor("op_11054"), val = tensor([1, 1])]; + tensor k_113_pad_type_0 = const()[name = tensor("k_113_pad_type_0"), val = tensor("custom")]; + tensor k_113_pad_0 = const()[name = tensor("k_113_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714676736)))]; + tensor k_113_cast_fp16 = conv(dilations = var_11054, groups = var_10509, pad = k_113_pad_0, pad_type = k_113_pad_type_0, strides = var_11052, weight = up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_307_cast_fp16)[name = tensor("k_113_cast_fp16")]; + tensor var_11058 = const()[name = tensor("op_11058"), val = tensor([1, 1])]; + tensor var_11060 = const()[name = tensor("op_11060"), val = tensor([1, 1])]; + tensor v_57_pad_type_0 = const()[name = tensor("v_57_pad_type_0"), val = tensor("custom")]; + tensor v_57_pad_0 = const()[name = tensor("v_57_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1714881600)))]; + tensor v_57_cast_fp16 = conv(dilations = var_11060, groups = var_10509, pad = v_57_pad_0, pad_type = v_57_pad_type_0, strides = var_11058, weight = up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_307_cast_fp16)[name = tensor("v_57_cast_fp16")]; + tensor var_11064_begin_0 = const()[name = tensor("op_11064_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11064_end_0 = const()[name = tensor("op_11064_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_11064_end_mask_0 = const()[name = tensor("op_11064_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11064_cast_fp16 = slice_by_index(begin = var_11064_begin_0, end = var_11064_end_0, end_mask = var_11064_end_mask_0, x = q_57_cast_fp16)[name = tensor("op_11064_cast_fp16")]; + tensor var_11068_begin_0 = const()[name = tensor("op_11068_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_11068_end_0 = const()[name = tensor("op_11068_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_11068_end_mask_0 = const()[name = tensor("op_11068_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11068_cast_fp16 = slice_by_index(begin = var_11068_begin_0, end = var_11068_end_0, end_mask = var_11068_end_mask_0, x = q_57_cast_fp16)[name = tensor("op_11068_cast_fp16")]; + tensor var_11072_begin_0 = const()[name = tensor("op_11072_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_11072_end_0 = const()[name = tensor("op_11072_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_11072_end_mask_0 = const()[name = tensor("op_11072_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11072_cast_fp16 = slice_by_index(begin = var_11072_begin_0, end = var_11072_end_0, end_mask = var_11072_end_mask_0, x = q_57_cast_fp16)[name = tensor("op_11072_cast_fp16")]; + tensor var_11076_begin_0 = const()[name = tensor("op_11076_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_11076_end_0 = const()[name = tensor("op_11076_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_11076_end_mask_0 = const()[name = tensor("op_11076_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11076_cast_fp16 = slice_by_index(begin = var_11076_begin_0, end = var_11076_end_0, end_mask = var_11076_end_mask_0, x = q_57_cast_fp16)[name = tensor("op_11076_cast_fp16")]; + tensor var_11080_begin_0 = const()[name = tensor("op_11080_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_11080_end_0 = const()[name = tensor("op_11080_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_11080_end_mask_0 = const()[name = tensor("op_11080_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11080_cast_fp16 = slice_by_index(begin = var_11080_begin_0, end = var_11080_end_0, end_mask = var_11080_end_mask_0, x = q_57_cast_fp16)[name = tensor("op_11080_cast_fp16")]; + tensor k_115_perm_0 = const()[name = tensor("k_115_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_11087_begin_0 = const()[name = tensor("op_11087_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11087_end_0 = const()[name = tensor("op_11087_end_0"), val = tensor([2, 2304, 1, 64])]; + tensor var_11087_end_mask_0 = const()[name = tensor("op_11087_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_3 = transpose(perm = k_115_perm_0, x = k_113_cast_fp16)[name = tensor("transpose_3")]; + tensor var_11087_cast_fp16 = slice_by_index(begin = var_11087_begin_0, end = var_11087_end_0, end_mask = var_11087_end_mask_0, x = transpose_3)[name = tensor("op_11087_cast_fp16")]; + tensor var_11091_begin_0 = const()[name = tensor("op_11091_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_11091_end_0 = const()[name = tensor("op_11091_end_0"), val = tensor([2, 2304, 1, 128])]; + tensor var_11091_end_mask_0 = const()[name = tensor("op_11091_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11091_cast_fp16 = slice_by_index(begin = var_11091_begin_0, end = var_11091_end_0, end_mask = var_11091_end_mask_0, x = transpose_3)[name = tensor("op_11091_cast_fp16")]; + tensor var_11095_begin_0 = const()[name = tensor("op_11095_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_11095_end_0 = const()[name = tensor("op_11095_end_0"), val = tensor([2, 2304, 1, 192])]; + tensor var_11095_end_mask_0 = const()[name = tensor("op_11095_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11095_cast_fp16 = slice_by_index(begin = var_11095_begin_0, end = var_11095_end_0, end_mask = var_11095_end_mask_0, x = transpose_3)[name = tensor("op_11095_cast_fp16")]; + tensor var_11099_begin_0 = const()[name = tensor("op_11099_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_11099_end_0 = const()[name = tensor("op_11099_end_0"), val = tensor([2, 2304, 1, 256])]; + tensor var_11099_end_mask_0 = const()[name = tensor("op_11099_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11099_cast_fp16 = slice_by_index(begin = var_11099_begin_0, end = var_11099_end_0, end_mask = var_11099_end_mask_0, x = transpose_3)[name = tensor("op_11099_cast_fp16")]; + tensor var_11103_begin_0 = const()[name = tensor("op_11103_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_11103_end_0 = const()[name = tensor("op_11103_end_0"), val = tensor([2, 2304, 1, 320])]; + tensor var_11103_end_mask_0 = const()[name = tensor("op_11103_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11103_cast_fp16 = slice_by_index(begin = var_11103_begin_0, end = var_11103_end_0, end_mask = var_11103_end_mask_0, x = transpose_3)[name = tensor("op_11103_cast_fp16")]; + tensor var_11105_begin_0 = const()[name = tensor("op_11105_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11105_end_0 = const()[name = tensor("op_11105_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_11105_end_mask_0 = const()[name = tensor("op_11105_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11105_cast_fp16 = slice_by_index(begin = var_11105_begin_0, end = var_11105_end_0, end_mask = var_11105_end_mask_0, x = v_57_cast_fp16)[name = tensor("op_11105_cast_fp16")]; + tensor var_11109_begin_0 = const()[name = tensor("op_11109_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_11109_end_0 = const()[name = tensor("op_11109_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_11109_end_mask_0 = const()[name = tensor("op_11109_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11109_cast_fp16 = slice_by_index(begin = var_11109_begin_0, end = var_11109_end_0, end_mask = var_11109_end_mask_0, x = v_57_cast_fp16)[name = tensor("op_11109_cast_fp16")]; + tensor var_11113_begin_0 = const()[name = tensor("op_11113_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_11113_end_0 = const()[name = tensor("op_11113_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_11113_end_mask_0 = const()[name = tensor("op_11113_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11113_cast_fp16 = slice_by_index(begin = var_11113_begin_0, end = var_11113_end_0, end_mask = var_11113_end_mask_0, x = v_57_cast_fp16)[name = tensor("op_11113_cast_fp16")]; + tensor var_11117_begin_0 = const()[name = tensor("op_11117_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_11117_end_0 = const()[name = tensor("op_11117_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_11117_end_mask_0 = const()[name = tensor("op_11117_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11117_cast_fp16 = slice_by_index(begin = var_11117_begin_0, end = var_11117_end_0, end_mask = var_11117_end_mask_0, x = v_57_cast_fp16)[name = tensor("op_11117_cast_fp16")]; + tensor var_11121_begin_0 = const()[name = tensor("op_11121_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_11121_end_0 = const()[name = tensor("op_11121_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_11121_end_mask_0 = const()[name = tensor("op_11121_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11121_cast_fp16 = slice_by_index(begin = var_11121_begin_0, end = var_11121_end_0, end_mask = var_11121_end_mask_0, x = v_57_cast_fp16)[name = tensor("op_11121_cast_fp16")]; + tensor var_11125_equation_0 = const()[name = tensor("op_11125_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11125_cast_fp16 = einsum(equation = var_11125_equation_0, values = (var_11087_cast_fp16, var_11064_cast_fp16))[name = tensor("op_11125_cast_fp16")]; + tensor var_11126_to_fp16 = const()[name = tensor("op_11126_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_741_cast_fp16 = mul(x = var_11125_cast_fp16, y = var_11126_to_fp16)[name = tensor("aw_741_cast_fp16")]; + tensor var_11129_equation_0 = const()[name = tensor("op_11129_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11129_cast_fp16 = einsum(equation = var_11129_equation_0, values = (var_11091_cast_fp16, var_11068_cast_fp16))[name = tensor("op_11129_cast_fp16")]; + tensor var_11130_to_fp16 = const()[name = tensor("op_11130_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_743_cast_fp16 = mul(x = var_11129_cast_fp16, y = var_11130_to_fp16)[name = tensor("aw_743_cast_fp16")]; + tensor var_11133_equation_0 = const()[name = tensor("op_11133_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11133_cast_fp16 = einsum(equation = var_11133_equation_0, values = (var_11095_cast_fp16, var_11072_cast_fp16))[name = tensor("op_11133_cast_fp16")]; + tensor var_11134_to_fp16 = const()[name = tensor("op_11134_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_745_cast_fp16 = mul(x = var_11133_cast_fp16, y = var_11134_to_fp16)[name = tensor("aw_745_cast_fp16")]; + tensor var_11137_equation_0 = const()[name = tensor("op_11137_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11137_cast_fp16 = einsum(equation = var_11137_equation_0, values = (var_11099_cast_fp16, var_11076_cast_fp16))[name = tensor("op_11137_cast_fp16")]; + tensor var_11138_to_fp16 = const()[name = tensor("op_11138_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_747_cast_fp16 = mul(x = var_11137_cast_fp16, y = var_11138_to_fp16)[name = tensor("aw_747_cast_fp16")]; + tensor var_11141_equation_0 = const()[name = tensor("op_11141_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11141_cast_fp16 = einsum(equation = var_11141_equation_0, values = (var_11103_cast_fp16, var_11080_cast_fp16))[name = tensor("op_11141_cast_fp16")]; + tensor var_11142_to_fp16 = const()[name = tensor("op_11142_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_749_cast_fp16 = mul(x = var_11141_cast_fp16, y = var_11142_to_fp16)[name = tensor("aw_749_cast_fp16")]; + tensor var_11144_cast_fp16 = softmax(axis = var_10509, x = aw_741_cast_fp16)[name = tensor("op_11144_cast_fp16")]; + tensor var_11145_cast_fp16 = softmax(axis = var_10509, x = aw_743_cast_fp16)[name = tensor("op_11145_cast_fp16")]; + tensor var_11146_cast_fp16 = softmax(axis = var_10509, x = aw_745_cast_fp16)[name = tensor("op_11146_cast_fp16")]; + tensor var_11147_cast_fp16 = softmax(axis = var_10509, x = aw_747_cast_fp16)[name = tensor("op_11147_cast_fp16")]; + tensor var_11148_cast_fp16 = softmax(axis = var_10509, x = aw_749_cast_fp16)[name = tensor("op_11148_cast_fp16")]; + tensor var_11150_equation_0 = const()[name = tensor("op_11150_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11150_cast_fp16 = einsum(equation = var_11150_equation_0, values = (var_11105_cast_fp16, var_11144_cast_fp16))[name = tensor("op_11150_cast_fp16")]; + tensor var_11152_equation_0 = const()[name = tensor("op_11152_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11152_cast_fp16 = einsum(equation = var_11152_equation_0, values = (var_11109_cast_fp16, var_11145_cast_fp16))[name = tensor("op_11152_cast_fp16")]; + tensor var_11154_equation_0 = const()[name = tensor("op_11154_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11154_cast_fp16 = einsum(equation = var_11154_equation_0, values = (var_11113_cast_fp16, var_11146_cast_fp16))[name = tensor("op_11154_cast_fp16")]; + tensor var_11156_equation_0 = const()[name = tensor("op_11156_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11156_cast_fp16 = einsum(equation = var_11156_equation_0, values = (var_11117_cast_fp16, var_11147_cast_fp16))[name = tensor("op_11156_cast_fp16")]; + tensor var_11158_equation_0 = const()[name = tensor("op_11158_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11158_cast_fp16 = einsum(equation = var_11158_equation_0, values = (var_11121_cast_fp16, var_11148_cast_fp16))[name = tensor("op_11158_cast_fp16")]; + tensor input_491_interleave_0 = const()[name = tensor("input_491_interleave_0"), val = tensor(false)]; + tensor input_491_cast_fp16 = concat(axis = var_10509, interleave = input_491_interleave_0, values = (var_11150_cast_fp16, var_11152_cast_fp16, var_11154_cast_fp16, var_11156_cast_fp16, var_11158_cast_fp16))[name = tensor("input_491_cast_fp16")]; + tensor var_11164 = const()[name = tensor("op_11164"), val = tensor([1, 1])]; + tensor var_11166 = const()[name = tensor("op_11166"), val = tensor([1, 1])]; + tensor var_11168_pad_type_0 = const()[name = tensor("op_11168_pad_type_0"), val = tensor("custom")]; + tensor var_11168_pad_0 = const()[name = tensor("op_11168_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1715086464)))]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1715291328)))]; + tensor var_11168_cast_fp16 = conv(bias = up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_11166, groups = var_10509, pad = var_11168_pad_0, pad_type = var_11168_pad_type_0, strides = var_11164, weight = up_blocks_3_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_491_cast_fp16)[name = tensor("op_11168_cast_fp16")]; + tensor inputs_87_cast_fp16 = add(x = var_11168_cast_fp16, y = inputs_85_cast_fp16)[name = tensor("inputs_87_cast_fp16")]; + tensor var_11172 = const()[name = tensor("op_11172"), val = tensor([1])]; + tensor channels_mean_87_cast_fp16 = reduce_mean(axes = var_11172, keep_dims = var_10504, x = inputs_87_cast_fp16)[name = tensor("channels_mean_87_cast_fp16")]; + tensor zero_mean_87_cast_fp16 = sub(x = inputs_87_cast_fp16, y = channels_mean_87_cast_fp16)[name = tensor("zero_mean_87_cast_fp16")]; + tensor zero_mean_sq_87_cast_fp16 = mul(x = zero_mean_87_cast_fp16, y = zero_mean_87_cast_fp16)[name = tensor("zero_mean_sq_87_cast_fp16")]; + tensor var_11176 = const()[name = tensor("op_11176"), val = tensor([1])]; + tensor var_11177_cast_fp16 = reduce_mean(axes = var_11176, keep_dims = var_10504, x = zero_mean_sq_87_cast_fp16)[name = tensor("op_11177_cast_fp16")]; + tensor var_11178_to_fp16 = const()[name = tensor("op_11178_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_11179_cast_fp16 = add(x = var_11177_cast_fp16, y = var_11178_to_fp16)[name = tensor("op_11179_cast_fp16")]; + tensor denom_87_epsilon_0_to_fp16 = const()[name = tensor("denom_87_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_87_cast_fp16 = rsqrt(epsilon = denom_87_epsilon_0_to_fp16, x = var_11179_cast_fp16)[name = tensor("denom_87_cast_fp16")]; + tensor out_87_cast_fp16 = mul(x = zero_mean_87_cast_fp16, y = denom_87_cast_fp16)[name = tensor("out_87_cast_fp16")]; + tensor var_11183_to_fp16 = const()[name = tensor("op_11183_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1715292032)))]; + tensor var_11184_cast_fp16 = add(x = out_87_cast_fp16, y = var_11183_to_fp16)[name = tensor("op_11184_cast_fp16")]; + tensor var_11186_to_fp16 = const()[name = tensor("op_11186_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1715292736)))]; + tensor hidden_states_309_cast_fp16 = mul(x = var_11184_cast_fp16, y = var_11186_to_fp16)[name = tensor("hidden_states_309_cast_fp16")]; + tensor var_11193 = const()[name = tensor("op_11193"), val = tensor([1, 1])]; + tensor var_11195 = const()[name = tensor("op_11195"), val = tensor([1, 1])]; + tensor q_59_pad_type_0 = const()[name = tensor("q_59_pad_type_0"), val = tensor("custom")]; + tensor q_59_pad_0 = const()[name = tensor("q_59_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1715293440)))]; + tensor q_59_cast_fp16 = conv(dilations = var_11195, groups = var_10509, pad = q_59_pad_0, pad_type = q_59_pad_type_0, strides = var_11193, weight = up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_309_cast_fp16)[name = tensor("q_59_cast_fp16")]; + tensor var_11199 = const()[name = tensor("op_11199"), val = tensor([1, 1])]; + tensor var_11201 = const()[name = tensor("op_11201"), val = tensor([1, 1])]; + tensor k_117_pad_type_0 = const()[name = tensor("k_117_pad_type_0"), val = tensor("custom")]; + tensor k_117_pad_0 = const()[name = tensor("k_117_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1715498304)))]; + tensor k_117_cast_fp16 = conv(dilations = var_11201, groups = var_10509, pad = k_117_pad_0, pad_type = k_117_pad_type_0, strides = var_11199, weight = up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_117_cast_fp16")]; + tensor var_11205 = const()[name = tensor("op_11205"), val = tensor([1, 1])]; + tensor var_11207 = const()[name = tensor("op_11207"), val = tensor([1, 1])]; + tensor v_59_pad_type_0 = const()[name = tensor("v_59_pad_type_0"), val = tensor("custom")]; + tensor v_59_pad_0 = const()[name = tensor("v_59_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1716153728)))]; + tensor v_59_cast_fp16 = conv(dilations = var_11207, groups = var_10509, pad = v_59_pad_0, pad_type = v_59_pad_type_0, strides = var_11205, weight = up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_59_cast_fp16")]; + tensor var_11211_begin_0 = const()[name = tensor("op_11211_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11211_end_0 = const()[name = tensor("op_11211_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_11211_end_mask_0 = const()[name = tensor("op_11211_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11211_cast_fp16 = slice_by_index(begin = var_11211_begin_0, end = var_11211_end_0, end_mask = var_11211_end_mask_0, x = q_59_cast_fp16)[name = tensor("op_11211_cast_fp16")]; + tensor var_11215_begin_0 = const()[name = tensor("op_11215_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_11215_end_0 = const()[name = tensor("op_11215_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_11215_end_mask_0 = const()[name = tensor("op_11215_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11215_cast_fp16 = slice_by_index(begin = var_11215_begin_0, end = var_11215_end_0, end_mask = var_11215_end_mask_0, x = q_59_cast_fp16)[name = tensor("op_11215_cast_fp16")]; + tensor var_11219_begin_0 = const()[name = tensor("op_11219_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_11219_end_0 = const()[name = tensor("op_11219_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_11219_end_mask_0 = const()[name = tensor("op_11219_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11219_cast_fp16 = slice_by_index(begin = var_11219_begin_0, end = var_11219_end_0, end_mask = var_11219_end_mask_0, x = q_59_cast_fp16)[name = tensor("op_11219_cast_fp16")]; + tensor var_11223_begin_0 = const()[name = tensor("op_11223_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_11223_end_0 = const()[name = tensor("op_11223_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_11223_end_mask_0 = const()[name = tensor("op_11223_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11223_cast_fp16 = slice_by_index(begin = var_11223_begin_0, end = var_11223_end_0, end_mask = var_11223_end_mask_0, x = q_59_cast_fp16)[name = tensor("op_11223_cast_fp16")]; + tensor var_11227_begin_0 = const()[name = tensor("op_11227_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_11227_end_0 = const()[name = tensor("op_11227_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_11227_end_mask_0 = const()[name = tensor("op_11227_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11227_cast_fp16 = slice_by_index(begin = var_11227_begin_0, end = var_11227_end_0, end_mask = var_11227_end_mask_0, x = q_59_cast_fp16)[name = tensor("op_11227_cast_fp16")]; + tensor k_119_perm_0 = const()[name = tensor("k_119_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_11234_begin_0 = const()[name = tensor("op_11234_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11234_end_0 = const()[name = tensor("op_11234_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_11234_end_mask_0 = const()[name = tensor("op_11234_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_2 = transpose(perm = k_119_perm_0, x = k_117_cast_fp16)[name = tensor("transpose_2")]; + tensor var_11234_cast_fp16 = slice_by_index(begin = var_11234_begin_0, end = var_11234_end_0, end_mask = var_11234_end_mask_0, x = transpose_2)[name = tensor("op_11234_cast_fp16")]; + tensor var_11238_begin_0 = const()[name = tensor("op_11238_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_11238_end_0 = const()[name = tensor("op_11238_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_11238_end_mask_0 = const()[name = tensor("op_11238_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11238_cast_fp16 = slice_by_index(begin = var_11238_begin_0, end = var_11238_end_0, end_mask = var_11238_end_mask_0, x = transpose_2)[name = tensor("op_11238_cast_fp16")]; + tensor var_11242_begin_0 = const()[name = tensor("op_11242_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_11242_end_0 = const()[name = tensor("op_11242_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_11242_end_mask_0 = const()[name = tensor("op_11242_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11242_cast_fp16 = slice_by_index(begin = var_11242_begin_0, end = var_11242_end_0, end_mask = var_11242_end_mask_0, x = transpose_2)[name = tensor("op_11242_cast_fp16")]; + tensor var_11246_begin_0 = const()[name = tensor("op_11246_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_11246_end_0 = const()[name = tensor("op_11246_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_11246_end_mask_0 = const()[name = tensor("op_11246_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11246_cast_fp16 = slice_by_index(begin = var_11246_begin_0, end = var_11246_end_0, end_mask = var_11246_end_mask_0, x = transpose_2)[name = tensor("op_11246_cast_fp16")]; + tensor var_11250_begin_0 = const()[name = tensor("op_11250_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_11250_end_0 = const()[name = tensor("op_11250_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_11250_end_mask_0 = const()[name = tensor("op_11250_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11250_cast_fp16 = slice_by_index(begin = var_11250_begin_0, end = var_11250_end_0, end_mask = var_11250_end_mask_0, x = transpose_2)[name = tensor("op_11250_cast_fp16")]; + tensor var_11252_begin_0 = const()[name = tensor("op_11252_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11252_end_0 = const()[name = tensor("op_11252_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_11252_end_mask_0 = const()[name = tensor("op_11252_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11252_cast_fp16 = slice_by_index(begin = var_11252_begin_0, end = var_11252_end_0, end_mask = var_11252_end_mask_0, x = v_59_cast_fp16)[name = tensor("op_11252_cast_fp16")]; + tensor var_11256_begin_0 = const()[name = tensor("op_11256_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_11256_end_0 = const()[name = tensor("op_11256_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_11256_end_mask_0 = const()[name = tensor("op_11256_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11256_cast_fp16 = slice_by_index(begin = var_11256_begin_0, end = var_11256_end_0, end_mask = var_11256_end_mask_0, x = v_59_cast_fp16)[name = tensor("op_11256_cast_fp16")]; + tensor var_11260_begin_0 = const()[name = tensor("op_11260_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_11260_end_0 = const()[name = tensor("op_11260_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_11260_end_mask_0 = const()[name = tensor("op_11260_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11260_cast_fp16 = slice_by_index(begin = var_11260_begin_0, end = var_11260_end_0, end_mask = var_11260_end_mask_0, x = v_59_cast_fp16)[name = tensor("op_11260_cast_fp16")]; + tensor var_11264_begin_0 = const()[name = tensor("op_11264_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_11264_end_0 = const()[name = tensor("op_11264_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_11264_end_mask_0 = const()[name = tensor("op_11264_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11264_cast_fp16 = slice_by_index(begin = var_11264_begin_0, end = var_11264_end_0, end_mask = var_11264_end_mask_0, x = v_59_cast_fp16)[name = tensor("op_11264_cast_fp16")]; + tensor var_11268_begin_0 = const()[name = tensor("op_11268_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_11268_end_0 = const()[name = tensor("op_11268_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_11268_end_mask_0 = const()[name = tensor("op_11268_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11268_cast_fp16 = slice_by_index(begin = var_11268_begin_0, end = var_11268_end_0, end_mask = var_11268_end_mask_0, x = v_59_cast_fp16)[name = tensor("op_11268_cast_fp16")]; + tensor var_11272_equation_0 = const()[name = tensor("op_11272_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11272_cast_fp16 = einsum(equation = var_11272_equation_0, values = (var_11234_cast_fp16, var_11211_cast_fp16))[name = tensor("op_11272_cast_fp16")]; + tensor var_11273_to_fp16 = const()[name = tensor("op_11273_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_751_cast_fp16 = mul(x = var_11272_cast_fp16, y = var_11273_to_fp16)[name = tensor("aw_751_cast_fp16")]; + tensor var_11276_equation_0 = const()[name = tensor("op_11276_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11276_cast_fp16 = einsum(equation = var_11276_equation_0, values = (var_11238_cast_fp16, var_11215_cast_fp16))[name = tensor("op_11276_cast_fp16")]; + tensor var_11277_to_fp16 = const()[name = tensor("op_11277_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_753_cast_fp16 = mul(x = var_11276_cast_fp16, y = var_11277_to_fp16)[name = tensor("aw_753_cast_fp16")]; + tensor var_11280_equation_0 = const()[name = tensor("op_11280_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11280_cast_fp16 = einsum(equation = var_11280_equation_0, values = (var_11242_cast_fp16, var_11219_cast_fp16))[name = tensor("op_11280_cast_fp16")]; + tensor var_11281_to_fp16 = const()[name = tensor("op_11281_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_755_cast_fp16 = mul(x = var_11280_cast_fp16, y = var_11281_to_fp16)[name = tensor("aw_755_cast_fp16")]; + tensor var_11284_equation_0 = const()[name = tensor("op_11284_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11284_cast_fp16 = einsum(equation = var_11284_equation_0, values = (var_11246_cast_fp16, var_11223_cast_fp16))[name = tensor("op_11284_cast_fp16")]; + tensor var_11285_to_fp16 = const()[name = tensor("op_11285_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_757_cast_fp16 = mul(x = var_11284_cast_fp16, y = var_11285_to_fp16)[name = tensor("aw_757_cast_fp16")]; + tensor var_11288_equation_0 = const()[name = tensor("op_11288_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11288_cast_fp16 = einsum(equation = var_11288_equation_0, values = (var_11250_cast_fp16, var_11227_cast_fp16))[name = tensor("op_11288_cast_fp16")]; + tensor var_11289_to_fp16 = const()[name = tensor("op_11289_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_759_cast_fp16 = mul(x = var_11288_cast_fp16, y = var_11289_to_fp16)[name = tensor("aw_759_cast_fp16")]; + tensor var_11291_cast_fp16 = softmax(axis = var_10509, x = aw_751_cast_fp16)[name = tensor("op_11291_cast_fp16")]; + tensor var_11292_cast_fp16 = softmax(axis = var_10509, x = aw_753_cast_fp16)[name = tensor("op_11292_cast_fp16")]; + tensor var_11293_cast_fp16 = softmax(axis = var_10509, x = aw_755_cast_fp16)[name = tensor("op_11293_cast_fp16")]; + tensor var_11294_cast_fp16 = softmax(axis = var_10509, x = aw_757_cast_fp16)[name = tensor("op_11294_cast_fp16")]; + tensor var_11295_cast_fp16 = softmax(axis = var_10509, x = aw_759_cast_fp16)[name = tensor("op_11295_cast_fp16")]; + tensor var_11297_equation_0 = const()[name = tensor("op_11297_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11297_cast_fp16 = einsum(equation = var_11297_equation_0, values = (var_11252_cast_fp16, var_11291_cast_fp16))[name = tensor("op_11297_cast_fp16")]; + tensor var_11299_equation_0 = const()[name = tensor("op_11299_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11299_cast_fp16 = einsum(equation = var_11299_equation_0, values = (var_11256_cast_fp16, var_11292_cast_fp16))[name = tensor("op_11299_cast_fp16")]; + tensor var_11301_equation_0 = const()[name = tensor("op_11301_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11301_cast_fp16 = einsum(equation = var_11301_equation_0, values = (var_11260_cast_fp16, var_11293_cast_fp16))[name = tensor("op_11301_cast_fp16")]; + tensor var_11303_equation_0 = const()[name = tensor("op_11303_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11303_cast_fp16 = einsum(equation = var_11303_equation_0, values = (var_11264_cast_fp16, var_11294_cast_fp16))[name = tensor("op_11303_cast_fp16")]; + tensor var_11305_equation_0 = const()[name = tensor("op_11305_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11305_cast_fp16 = einsum(equation = var_11305_equation_0, values = (var_11268_cast_fp16, var_11295_cast_fp16))[name = tensor("op_11305_cast_fp16")]; + tensor input_493_interleave_0 = const()[name = tensor("input_493_interleave_0"), val = tensor(false)]; + tensor input_493_cast_fp16 = concat(axis = var_10509, interleave = input_493_interleave_0, values = (var_11297_cast_fp16, var_11299_cast_fp16, var_11301_cast_fp16, var_11303_cast_fp16, var_11305_cast_fp16))[name = tensor("input_493_cast_fp16")]; + tensor var_11311 = const()[name = tensor("op_11311"), val = tensor([1, 1])]; + tensor var_11313 = const()[name = tensor("op_11313"), val = tensor([1, 1])]; + tensor var_11315_pad_type_0 = const()[name = tensor("op_11315_pad_type_0"), val = tensor("custom")]; + tensor var_11315_pad_0 = const()[name = tensor("op_11315_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1716809152)))]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1717014016)))]; + tensor var_11315_cast_fp16 = conv(bias = up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_11313, groups = var_10509, pad = var_11315_pad_0, pad_type = var_11315_pad_type_0, strides = var_11311, weight = up_blocks_3_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_493_cast_fp16)[name = tensor("op_11315_cast_fp16")]; + tensor inputs_89_cast_fp16 = add(x = var_11315_cast_fp16, y = inputs_87_cast_fp16)[name = tensor("inputs_89_cast_fp16")]; + tensor var_11319 = const()[name = tensor("op_11319"), val = tensor([1])]; + tensor channels_mean_89_cast_fp16 = reduce_mean(axes = var_11319, keep_dims = var_10504, x = inputs_89_cast_fp16)[name = tensor("channels_mean_89_cast_fp16")]; + tensor zero_mean_89_cast_fp16 = sub(x = inputs_89_cast_fp16, y = channels_mean_89_cast_fp16)[name = tensor("zero_mean_89_cast_fp16")]; + tensor zero_mean_sq_89_cast_fp16 = mul(x = zero_mean_89_cast_fp16, y = zero_mean_89_cast_fp16)[name = tensor("zero_mean_sq_89_cast_fp16")]; + tensor var_11323 = const()[name = tensor("op_11323"), val = tensor([1])]; + tensor var_11324_cast_fp16 = reduce_mean(axes = var_11323, keep_dims = var_10504, x = zero_mean_sq_89_cast_fp16)[name = tensor("op_11324_cast_fp16")]; + tensor var_11325_to_fp16 = const()[name = tensor("op_11325_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_11326_cast_fp16 = add(x = var_11324_cast_fp16, y = var_11325_to_fp16)[name = tensor("op_11326_cast_fp16")]; + tensor denom_89_epsilon_0_to_fp16 = const()[name = tensor("denom_89_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_89_cast_fp16 = rsqrt(epsilon = denom_89_epsilon_0_to_fp16, x = var_11326_cast_fp16)[name = tensor("denom_89_cast_fp16")]; + tensor out_89_cast_fp16 = mul(x = zero_mean_89_cast_fp16, y = denom_89_cast_fp16)[name = tensor("out_89_cast_fp16")]; + tensor var_11330_to_fp16 = const()[name = tensor("op_11330_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1717014720)))]; + tensor var_11331_cast_fp16 = add(x = out_89_cast_fp16, y = var_11330_to_fp16)[name = tensor("op_11331_cast_fp16")]; + tensor var_11333_to_fp16 = const()[name = tensor("op_11333_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1717015424)))]; + tensor input_495_cast_fp16 = mul(x = var_11331_cast_fp16, y = var_11333_to_fp16)[name = tensor("input_495_cast_fp16")]; + tensor var_11341 = const()[name = tensor("op_11341"), val = tensor([1, 1])]; + tensor var_11343 = const()[name = tensor("op_11343"), val = tensor([1, 1])]; + tensor var_11345_pad_type_0 = const()[name = tensor("op_11345_pad_type_0"), val = tensor("custom")]; + tensor var_11345_pad_0 = const()[name = tensor("op_11345_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1717016128)))]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1718654592)))]; + tensor var_11345_cast_fp16 = conv(bias = up_blocks_3_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_11343, groups = var_10509, pad = var_11345_pad_0, pad_type = var_11345_pad_type_0, strides = var_11341, weight = up_blocks_3_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_495_cast_fp16)[name = tensor("op_11345_cast_fp16")]; + tensor var_11346_split_sizes_0 = const()[name = tensor("op_11346_split_sizes_0"), val = tensor([1280, 1280])]; + tensor var_11346_axis_0 = const()[name = tensor("op_11346_axis_0"), val = tensor(1)]; + tensor var_11346_cast_fp16_0, tensor var_11346_cast_fp16_1 = split(axis = var_11346_axis_0, split_sizes = var_11346_split_sizes_0, x = var_11345_cast_fp16)[name = tensor("op_11346_cast_fp16")]; + tensor var_11348_mode_0 = const()[name = tensor("op_11348_mode_0"), val = tensor("EXACT")]; + tensor var_11348_cast_fp16 = gelu(mode = var_11348_mode_0, x = var_11346_cast_fp16_1)[name = tensor("op_11348_cast_fp16")]; + tensor input_497_cast_fp16 = mul(x = var_11346_cast_fp16_0, y = var_11348_cast_fp16)[name = tensor("input_497_cast_fp16")]; + tensor var_11352 = const()[name = tensor("op_11352"), val = tensor([1, 1])]; + tensor var_11354 = const()[name = tensor("op_11354"), val = tensor([1, 1])]; + tensor var_11356_pad_type_0 = const()[name = tensor("op_11356_pad_type_0"), val = tensor("custom")]; + tensor var_11356_pad_0 = const()[name = tensor("op_11356_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1718659776)))]; + tensor up_blocks_3_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1719479040)))]; + tensor var_11356_cast_fp16 = conv(bias = up_blocks_3_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_11354, groups = var_10509, pad = var_11356_pad_0, pad_type = var_11356_pad_type_0, strides = var_11352, weight = up_blocks_3_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_497_cast_fp16)[name = tensor("op_11356_cast_fp16")]; + tensor hidden_states_313_cast_fp16 = add(x = var_11356_cast_fp16, y = inputs_89_cast_fp16)[name = tensor("hidden_states_313_cast_fp16")]; + tensor var_11358 = const()[name = tensor("op_11358"), val = tensor([2, 320, 48, 48])]; + tensor input_499_cast_fp16 = reshape(shape = var_11358, x = hidden_states_313_cast_fp16)[name = tensor("input_499_cast_fp16")]; + tensor var_11362 = const()[name = tensor("op_11362"), val = tensor([1, 1])]; + tensor var_11364 = const()[name = tensor("op_11364"), val = tensor([1, 1])]; + tensor hidden_states_315_pad_type_0 = const()[name = tensor("hidden_states_315_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_315_pad_0 = const()[name = tensor("hidden_states_315_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_1_proj_out_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1719479744)))]; + tensor up_blocks_3_attentions_1_proj_out_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_1_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1719684608)))]; + tensor hidden_states_315_cast_fp16 = conv(bias = up_blocks_3_attentions_1_proj_out_bias_to_fp16, dilations = var_11364, groups = var_10509, pad = hidden_states_315_pad_0, pad_type = hidden_states_315_pad_type_0, strides = var_11362, weight = up_blocks_3_attentions_1_proj_out_weight_to_fp16, x = input_499_cast_fp16)[name = tensor("hidden_states_315_cast_fp16")]; + tensor hidden_states_317_cast_fp16 = add(x = hidden_states_315_cast_fp16, y = hidden_states_303_cast_fp16)[name = tensor("hidden_states_317_cast_fp16")]; + tensor input_501_interleave_0 = const()[name = tensor("input_501_interleave_0"), val = tensor(false)]; + tensor input_501_cast_fp16 = concat(axis = var_10509, interleave = input_501_interleave_0, values = (hidden_states_317_cast_fp16, input_7_cast_fp16))[name = tensor("input_501_cast_fp16")]; + tensor reshape_228_shape_0 = const()[name = tensor("reshape_228_shape_0"), val = tensor([2, 32, 20, 48, 48])]; + tensor reshape_228_cast_fp16 = reshape(shape = reshape_228_shape_0, x = input_501_cast_fp16)[name = tensor("reshape_228_cast_fp16")]; + tensor reduce_mean_171_axes_0 = const()[name = tensor("reduce_mean_171_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_171_keep_dims_0 = const()[name = tensor("reduce_mean_171_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_171_cast_fp16 = reduce_mean(axes = reduce_mean_171_axes_0, keep_dims = reduce_mean_171_keep_dims_0, x = reshape_228_cast_fp16)[name = tensor("reduce_mean_171_cast_fp16")]; + tensor sub_114_cast_fp16 = sub(x = reshape_228_cast_fp16, y = reduce_mean_171_cast_fp16)[name = tensor("sub_114_cast_fp16")]; + tensor square_57_cast_fp16 = square(x = sub_114_cast_fp16)[name = tensor("square_57_cast_fp16")]; + tensor reduce_mean_173_axes_0 = const()[name = tensor("reduce_mean_173_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_173_keep_dims_0 = const()[name = tensor("reduce_mean_173_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_173_cast_fp16 = reduce_mean(axes = reduce_mean_173_axes_0, keep_dims = reduce_mean_173_keep_dims_0, x = square_57_cast_fp16)[name = tensor("reduce_mean_173_cast_fp16")]; + tensor add_114_y_0_to_fp16 = const()[name = tensor("add_114_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_114_cast_fp16 = add(x = reduce_mean_173_cast_fp16, y = add_114_y_0_to_fp16)[name = tensor("add_114_cast_fp16")]; + tensor sqrt_57_cast_fp16 = sqrt(x = add_114_cast_fp16)[name = tensor("sqrt_57_cast_fp16")]; + tensor real_div_57_cast_fp16 = real_div(x = sub_114_cast_fp16, y = sqrt_57_cast_fp16)[name = tensor("real_div_57_cast_fp16")]; + tensor reshape_229_shape_0 = const()[name = tensor("reshape_229_shape_0"), val = tensor([2, 640, 48, 48])]; + tensor reshape_229_cast_fp16 = reshape(shape = reshape_229_shape_0, x = real_div_57_cast_fp16)[name = tensor("reshape_229_cast_fp16")]; + tensor add_115_gamma_0_to_fp16 = const()[name = tensor("add_115_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1719685312)))]; + tensor add_115_beta_0_to_fp16 = const()[name = tensor("add_115_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1719686656)))]; + tensor add_115_epsilon_0_to_fp16 = const()[name = tensor("add_115_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_115_cast_fp16 = batch_norm(beta = add_115_beta_0_to_fp16, epsilon = add_115_epsilon_0_to_fp16, gamma = add_115_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_229_cast_fp16)[name = tensor("add_115_cast_fp16")]; + tensor input_505_cast_fp16 = silu(x = add_115_cast_fp16)[name = tensor("input_505_cast_fp16")]; + tensor var_11382 = const()[name = tensor("op_11382"), val = tensor([1, 1])]; + tensor var_11384 = const()[name = tensor("op_11384"), val = tensor([1, 1])]; + tensor hidden_states_319_pad_type_0 = const()[name = tensor("hidden_states_319_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_319_pad_0 = const()[name = tensor("hidden_states_319_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_3_resnets_2_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_2_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1719688000)))]; + tensor up_blocks_3_resnets_2_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_2_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1723374464)))]; + tensor hidden_states_319_cast_fp16 = conv(bias = up_blocks_3_resnets_2_conv1_bias_to_fp16, dilations = var_11384, groups = var_10509, pad = hidden_states_319_pad_0, pad_type = hidden_states_319_pad_type_0, strides = var_11382, weight = up_blocks_3_resnets_2_conv1_weight_to_fp16, x = input_505_cast_fp16)[name = tensor("hidden_states_319_cast_fp16")]; + tensor var_11390 = const()[name = tensor("op_11390"), val = tensor([1, 1])]; + tensor var_11392 = const()[name = tensor("op_11392"), val = tensor([1, 1])]; + tensor temb_pad_type_0 = const()[name = tensor("temb_pad_type_0"), val = tensor("custom")]; + tensor temb_pad_0 = const()[name = tensor("temb_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_resnets_2_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_2_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1723375168)))]; + tensor up_blocks_3_resnets_2_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_2_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1724194432)))]; + tensor temb_cast_fp16 = conv(bias = up_blocks_3_resnets_2_time_emb_proj_bias_to_fp16, dilations = var_11392, groups = var_10509, pad = temb_pad_0, pad_type = temb_pad_type_0, strides = var_11390, weight = up_blocks_3_resnets_2_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16)[name = tensor("temb_cast_fp16")]; + tensor input_509_cast_fp16 = add(x = hidden_states_319_cast_fp16, y = temb_cast_fp16)[name = tensor("input_509_cast_fp16")]; + tensor reshape_232_shape_0 = const()[name = tensor("reshape_232_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_232_cast_fp16 = reshape(shape = reshape_232_shape_0, x = input_509_cast_fp16)[name = tensor("reshape_232_cast_fp16")]; + tensor reduce_mean_174_axes_0 = const()[name = tensor("reduce_mean_174_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_174_keep_dims_0 = const()[name = tensor("reduce_mean_174_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_174_cast_fp16 = reduce_mean(axes = reduce_mean_174_axes_0, keep_dims = reduce_mean_174_keep_dims_0, x = reshape_232_cast_fp16)[name = tensor("reduce_mean_174_cast_fp16")]; + tensor sub_116_cast_fp16 = sub(x = reshape_232_cast_fp16, y = reduce_mean_174_cast_fp16)[name = tensor("sub_116_cast_fp16")]; + tensor square_58_cast_fp16 = square(x = sub_116_cast_fp16)[name = tensor("square_58_cast_fp16")]; + tensor reduce_mean_176_axes_0 = const()[name = tensor("reduce_mean_176_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_176_keep_dims_0 = const()[name = tensor("reduce_mean_176_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_176_cast_fp16 = reduce_mean(axes = reduce_mean_176_axes_0, keep_dims = reduce_mean_176_keep_dims_0, x = square_58_cast_fp16)[name = tensor("reduce_mean_176_cast_fp16")]; + tensor add_116_y_0_to_fp16 = const()[name = tensor("add_116_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_116_cast_fp16 = add(x = reduce_mean_176_cast_fp16, y = add_116_y_0_to_fp16)[name = tensor("add_116_cast_fp16")]; + tensor sqrt_58_cast_fp16 = sqrt(x = add_116_cast_fp16)[name = tensor("sqrt_58_cast_fp16")]; + tensor real_div_58_cast_fp16 = real_div(x = sub_116_cast_fp16, y = sqrt_58_cast_fp16)[name = tensor("real_div_58_cast_fp16")]; + tensor reshape_233_shape_0 = const()[name = tensor("reshape_233_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_233_cast_fp16 = reshape(shape = reshape_233_shape_0, x = real_div_58_cast_fp16)[name = tensor("reshape_233_cast_fp16")]; + tensor add_117_gamma_0_to_fp16 = const()[name = tensor("add_117_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1724195136)))]; + tensor add_117_beta_0_to_fp16 = const()[name = tensor("add_117_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1724195840)))]; + tensor add_117_epsilon_0_to_fp16 = const()[name = tensor("add_117_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_117_cast_fp16 = batch_norm(beta = add_117_beta_0_to_fp16, epsilon = add_117_epsilon_0_to_fp16, gamma = add_117_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_233_cast_fp16)[name = tensor("add_117_cast_fp16")]; + tensor input_513_cast_fp16 = silu(x = add_117_cast_fp16)[name = tensor("input_513_cast_fp16")]; + tensor var_11402 = const()[name = tensor("op_11402"), val = tensor([1, 1])]; + tensor var_11404 = const()[name = tensor("op_11404"), val = tensor([1, 1])]; + tensor hidden_states_321_pad_type_0 = const()[name = tensor("hidden_states_321_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_321_pad_0 = const()[name = tensor("hidden_states_321_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor up_blocks_3_resnets_2_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_2_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1724196544)))]; + tensor up_blocks_3_resnets_2_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_2_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726039808)))]; + tensor hidden_states_321_cast_fp16 = conv(bias = up_blocks_3_resnets_2_conv2_bias_to_fp16, dilations = var_11404, groups = var_10509, pad = hidden_states_321_pad_0, pad_type = hidden_states_321_pad_type_0, strides = var_11402, weight = up_blocks_3_resnets_2_conv2_weight_to_fp16, x = input_513_cast_fp16)[name = tensor("hidden_states_321_cast_fp16")]; + tensor var_11409 = const()[name = tensor("op_11409"), val = tensor([1, 1])]; + tensor var_11411 = const()[name = tensor("op_11411"), val = tensor([1, 1])]; + tensor x_pad_type_0 = const()[name = tensor("x_pad_type_0"), val = tensor("custom")]; + tensor x_pad_0 = const()[name = tensor("x_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_resnets_2_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_3_resnets_2_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726040512)))]; + tensor up_blocks_3_resnets_2_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_3_resnets_2_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726450176)))]; + tensor x_cast_fp16 = conv(bias = up_blocks_3_resnets_2_conv_shortcut_bias_to_fp16, dilations = var_11411, groups = var_10509, pad = x_pad_0, pad_type = x_pad_type_0, strides = var_11409, weight = up_blocks_3_resnets_2_conv_shortcut_weight_to_fp16, x = input_501_cast_fp16)[name = tensor("x_cast_fp16")]; + tensor hidden_states_323_cast_fp16 = add(x = x_cast_fp16, y = hidden_states_321_cast_fp16)[name = tensor("hidden_states_323_cast_fp16")]; + tensor reshape_236_shape_0 = const()[name = tensor("reshape_236_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_236_cast_fp16 = reshape(shape = reshape_236_shape_0, x = hidden_states_323_cast_fp16)[name = tensor("reshape_236_cast_fp16")]; + tensor reduce_mean_177_axes_0 = const()[name = tensor("reduce_mean_177_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_177_keep_dims_0 = const()[name = tensor("reduce_mean_177_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_177_cast_fp16 = reduce_mean(axes = reduce_mean_177_axes_0, keep_dims = reduce_mean_177_keep_dims_0, x = reshape_236_cast_fp16)[name = tensor("reduce_mean_177_cast_fp16")]; + tensor sub_118_cast_fp16 = sub(x = reshape_236_cast_fp16, y = reduce_mean_177_cast_fp16)[name = tensor("sub_118_cast_fp16")]; + tensor square_59_cast_fp16 = square(x = sub_118_cast_fp16)[name = tensor("square_59_cast_fp16")]; + tensor reduce_mean_179_axes_0 = const()[name = tensor("reduce_mean_179_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_179_keep_dims_0 = const()[name = tensor("reduce_mean_179_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_179_cast_fp16 = reduce_mean(axes = reduce_mean_179_axes_0, keep_dims = reduce_mean_179_keep_dims_0, x = square_59_cast_fp16)[name = tensor("reduce_mean_179_cast_fp16")]; + tensor add_118_y_0_to_fp16 = const()[name = tensor("add_118_y_0_to_fp16"), val = tensor(0x1.1p-20)]; + tensor add_118_cast_fp16 = add(x = reduce_mean_179_cast_fp16, y = add_118_y_0_to_fp16)[name = tensor("add_118_cast_fp16")]; + tensor sqrt_59_cast_fp16 = sqrt(x = add_118_cast_fp16)[name = tensor("sqrt_59_cast_fp16")]; + tensor real_div_59_cast_fp16 = real_div(x = sub_118_cast_fp16, y = sqrt_59_cast_fp16)[name = tensor("real_div_59_cast_fp16")]; + tensor reshape_237_shape_0 = const()[name = tensor("reshape_237_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_237_cast_fp16 = reshape(shape = reshape_237_shape_0, x = real_div_59_cast_fp16)[name = tensor("reshape_237_cast_fp16")]; + tensor add_119_gamma_0_to_fp16 = const()[name = tensor("add_119_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726450880)))]; + tensor add_119_beta_0_to_fp16 = const()[name = tensor("add_119_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726451584)))]; + tensor add_119_epsilon_0_to_fp16 = const()[name = tensor("add_119_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_119_cast_fp16 = batch_norm(beta = add_119_beta_0_to_fp16, epsilon = add_119_epsilon_0_to_fp16, gamma = add_119_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_237_cast_fp16)[name = tensor("add_119_cast_fp16")]; + tensor var_11431 = const()[name = tensor("op_11431"), val = tensor([1, 1])]; + tensor var_11433 = const()[name = tensor("op_11433"), val = tensor([1, 1])]; + tensor hidden_states_325_pad_type_0 = const()[name = tensor("hidden_states_325_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_325_pad_0 = const()[name = tensor("hidden_states_325_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_proj_in_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726452288)))]; + tensor up_blocks_3_attentions_2_proj_in_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726657152)))]; + tensor hidden_states_325_cast_fp16 = conv(bias = up_blocks_3_attentions_2_proj_in_bias_to_fp16, dilations = var_11433, groups = var_10509, pad = hidden_states_325_pad_0, pad_type = hidden_states_325_pad_type_0, strides = var_11431, weight = up_blocks_3_attentions_2_proj_in_weight_to_fp16, x = add_119_cast_fp16)[name = tensor("hidden_states_325_cast_fp16")]; + tensor var_11438 = const()[name = tensor("op_11438"), val = tensor([2, 320, 1, 2304])]; + tensor inputs_91_cast_fp16 = reshape(shape = var_11438, x = hidden_states_325_cast_fp16)[name = tensor("inputs_91_cast_fp16")]; + tensor var_11448 = const()[name = tensor("op_11448"), val = tensor([1])]; + tensor channels_mean_91_cast_fp16 = reduce_mean(axes = var_11448, keep_dims = var_10504, x = inputs_91_cast_fp16)[name = tensor("channels_mean_91_cast_fp16")]; + tensor zero_mean_91_cast_fp16 = sub(x = inputs_91_cast_fp16, y = channels_mean_91_cast_fp16)[name = tensor("zero_mean_91_cast_fp16")]; + tensor zero_mean_sq_91_cast_fp16 = mul(x = zero_mean_91_cast_fp16, y = zero_mean_91_cast_fp16)[name = tensor("zero_mean_sq_91_cast_fp16")]; + tensor var_11452 = const()[name = tensor("op_11452"), val = tensor([1])]; + tensor var_11453_cast_fp16 = reduce_mean(axes = var_11452, keep_dims = var_10504, x = zero_mean_sq_91_cast_fp16)[name = tensor("op_11453_cast_fp16")]; + tensor var_11454_to_fp16 = const()[name = tensor("op_11454_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_11455_cast_fp16 = add(x = var_11453_cast_fp16, y = var_11454_to_fp16)[name = tensor("op_11455_cast_fp16")]; + tensor denom_91_epsilon_0_to_fp16 = const()[name = tensor("denom_91_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_91_cast_fp16 = rsqrt(epsilon = denom_91_epsilon_0_to_fp16, x = var_11455_cast_fp16)[name = tensor("denom_91_cast_fp16")]; + tensor out_91_cast_fp16 = mul(x = zero_mean_91_cast_fp16, y = denom_91_cast_fp16)[name = tensor("out_91_cast_fp16")]; + tensor var_11459_to_fp16 = const()[name = tensor("op_11459_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726657856)))]; + tensor var_11460_cast_fp16 = add(x = out_91_cast_fp16, y = var_11459_to_fp16)[name = tensor("op_11460_cast_fp16")]; + tensor var_11462_to_fp16 = const()[name = tensor("op_11462_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726658560)))]; + tensor hidden_states_327_cast_fp16 = mul(x = var_11460_cast_fp16, y = var_11462_to_fp16)[name = tensor("hidden_states_327_cast_fp16")]; + tensor var_11469 = const()[name = tensor("op_11469"), val = tensor([1, 1])]; + tensor var_11471 = const()[name = tensor("op_11471"), val = tensor([1, 1])]; + tensor q_61_pad_type_0 = const()[name = tensor("q_61_pad_type_0"), val = tensor("custom")]; + tensor q_61_pad_0 = const()[name = tensor("q_61_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726659264)))]; + tensor q_61_cast_fp16 = conv(dilations = var_11471, groups = var_10509, pad = q_61_pad_0, pad_type = q_61_pad_type_0, strides = var_11469, weight = up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_327_cast_fp16)[name = tensor("q_61_cast_fp16")]; + tensor var_11475 = const()[name = tensor("op_11475"), val = tensor([1, 1])]; + tensor var_11477 = const()[name = tensor("op_11477"), val = tensor([1, 1])]; + tensor k_121_pad_type_0 = const()[name = tensor("k_121_pad_type_0"), val = tensor("custom")]; + tensor k_121_pad_0 = const()[name = tensor("k_121_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1726864128)))]; + tensor k_121_cast_fp16 = conv(dilations = var_11477, groups = var_10509, pad = k_121_pad_0, pad_type = k_121_pad_type_0, strides = var_11475, weight = up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_327_cast_fp16)[name = tensor("k_121_cast_fp16")]; + tensor var_11481 = const()[name = tensor("op_11481"), val = tensor([1, 1])]; + tensor var_11483 = const()[name = tensor("op_11483"), val = tensor([1, 1])]; + tensor v_61_pad_type_0 = const()[name = tensor("v_61_pad_type_0"), val = tensor("custom")]; + tensor v_61_pad_0 = const()[name = tensor("v_61_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1727068992)))]; + tensor v_61_cast_fp16 = conv(dilations = var_11483, groups = var_10509, pad = v_61_pad_0, pad_type = v_61_pad_type_0, strides = var_11481, weight = up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_327_cast_fp16)[name = tensor("v_61_cast_fp16")]; + tensor var_11487_begin_0 = const()[name = tensor("op_11487_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11487_end_0 = const()[name = tensor("op_11487_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_11487_end_mask_0 = const()[name = tensor("op_11487_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11487_cast_fp16 = slice_by_index(begin = var_11487_begin_0, end = var_11487_end_0, end_mask = var_11487_end_mask_0, x = q_61_cast_fp16)[name = tensor("op_11487_cast_fp16")]; + tensor var_11491_begin_0 = const()[name = tensor("op_11491_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_11491_end_0 = const()[name = tensor("op_11491_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_11491_end_mask_0 = const()[name = tensor("op_11491_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11491_cast_fp16 = slice_by_index(begin = var_11491_begin_0, end = var_11491_end_0, end_mask = var_11491_end_mask_0, x = q_61_cast_fp16)[name = tensor("op_11491_cast_fp16")]; + tensor var_11495_begin_0 = const()[name = tensor("op_11495_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_11495_end_0 = const()[name = tensor("op_11495_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_11495_end_mask_0 = const()[name = tensor("op_11495_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11495_cast_fp16 = slice_by_index(begin = var_11495_begin_0, end = var_11495_end_0, end_mask = var_11495_end_mask_0, x = q_61_cast_fp16)[name = tensor("op_11495_cast_fp16")]; + tensor var_11499_begin_0 = const()[name = tensor("op_11499_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_11499_end_0 = const()[name = tensor("op_11499_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_11499_end_mask_0 = const()[name = tensor("op_11499_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11499_cast_fp16 = slice_by_index(begin = var_11499_begin_0, end = var_11499_end_0, end_mask = var_11499_end_mask_0, x = q_61_cast_fp16)[name = tensor("op_11499_cast_fp16")]; + tensor var_11503_begin_0 = const()[name = tensor("op_11503_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_11503_end_0 = const()[name = tensor("op_11503_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_11503_end_mask_0 = const()[name = tensor("op_11503_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11503_cast_fp16 = slice_by_index(begin = var_11503_begin_0, end = var_11503_end_0, end_mask = var_11503_end_mask_0, x = q_61_cast_fp16)[name = tensor("op_11503_cast_fp16")]; + tensor k_123_perm_0 = const()[name = tensor("k_123_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_11510_begin_0 = const()[name = tensor("op_11510_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11510_end_0 = const()[name = tensor("op_11510_end_0"), val = tensor([2, 2304, 1, 64])]; + tensor var_11510_end_mask_0 = const()[name = tensor("op_11510_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_1 = transpose(perm = k_123_perm_0, x = k_121_cast_fp16)[name = tensor("transpose_1")]; + tensor var_11510_cast_fp16 = slice_by_index(begin = var_11510_begin_0, end = var_11510_end_0, end_mask = var_11510_end_mask_0, x = transpose_1)[name = tensor("op_11510_cast_fp16")]; + tensor var_11514_begin_0 = const()[name = tensor("op_11514_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_11514_end_0 = const()[name = tensor("op_11514_end_0"), val = tensor([2, 2304, 1, 128])]; + tensor var_11514_end_mask_0 = const()[name = tensor("op_11514_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11514_cast_fp16 = slice_by_index(begin = var_11514_begin_0, end = var_11514_end_0, end_mask = var_11514_end_mask_0, x = transpose_1)[name = tensor("op_11514_cast_fp16")]; + tensor var_11518_begin_0 = const()[name = tensor("op_11518_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_11518_end_0 = const()[name = tensor("op_11518_end_0"), val = tensor([2, 2304, 1, 192])]; + tensor var_11518_end_mask_0 = const()[name = tensor("op_11518_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11518_cast_fp16 = slice_by_index(begin = var_11518_begin_0, end = var_11518_end_0, end_mask = var_11518_end_mask_0, x = transpose_1)[name = tensor("op_11518_cast_fp16")]; + tensor var_11522_begin_0 = const()[name = tensor("op_11522_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_11522_end_0 = const()[name = tensor("op_11522_end_0"), val = tensor([2, 2304, 1, 256])]; + tensor var_11522_end_mask_0 = const()[name = tensor("op_11522_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11522_cast_fp16 = slice_by_index(begin = var_11522_begin_0, end = var_11522_end_0, end_mask = var_11522_end_mask_0, x = transpose_1)[name = tensor("op_11522_cast_fp16")]; + tensor var_11526_begin_0 = const()[name = tensor("op_11526_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_11526_end_0 = const()[name = tensor("op_11526_end_0"), val = tensor([2, 2304, 1, 320])]; + tensor var_11526_end_mask_0 = const()[name = tensor("op_11526_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11526_cast_fp16 = slice_by_index(begin = var_11526_begin_0, end = var_11526_end_0, end_mask = var_11526_end_mask_0, x = transpose_1)[name = tensor("op_11526_cast_fp16")]; + tensor var_11528_begin_0 = const()[name = tensor("op_11528_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11528_end_0 = const()[name = tensor("op_11528_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_11528_end_mask_0 = const()[name = tensor("op_11528_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11528_cast_fp16 = slice_by_index(begin = var_11528_begin_0, end = var_11528_end_0, end_mask = var_11528_end_mask_0, x = v_61_cast_fp16)[name = tensor("op_11528_cast_fp16")]; + tensor var_11532_begin_0 = const()[name = tensor("op_11532_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_11532_end_0 = const()[name = tensor("op_11532_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_11532_end_mask_0 = const()[name = tensor("op_11532_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11532_cast_fp16 = slice_by_index(begin = var_11532_begin_0, end = var_11532_end_0, end_mask = var_11532_end_mask_0, x = v_61_cast_fp16)[name = tensor("op_11532_cast_fp16")]; + tensor var_11536_begin_0 = const()[name = tensor("op_11536_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_11536_end_0 = const()[name = tensor("op_11536_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_11536_end_mask_0 = const()[name = tensor("op_11536_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11536_cast_fp16 = slice_by_index(begin = var_11536_begin_0, end = var_11536_end_0, end_mask = var_11536_end_mask_0, x = v_61_cast_fp16)[name = tensor("op_11536_cast_fp16")]; + tensor var_11540_begin_0 = const()[name = tensor("op_11540_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_11540_end_0 = const()[name = tensor("op_11540_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_11540_end_mask_0 = const()[name = tensor("op_11540_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11540_cast_fp16 = slice_by_index(begin = var_11540_begin_0, end = var_11540_end_0, end_mask = var_11540_end_mask_0, x = v_61_cast_fp16)[name = tensor("op_11540_cast_fp16")]; + tensor var_11544_begin_0 = const()[name = tensor("op_11544_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_11544_end_0 = const()[name = tensor("op_11544_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_11544_end_mask_0 = const()[name = tensor("op_11544_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11544_cast_fp16 = slice_by_index(begin = var_11544_begin_0, end = var_11544_end_0, end_mask = var_11544_end_mask_0, x = v_61_cast_fp16)[name = tensor("op_11544_cast_fp16")]; + tensor var_11548_equation_0 = const()[name = tensor("op_11548_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11548_cast_fp16 = einsum(equation = var_11548_equation_0, values = (var_11510_cast_fp16, var_11487_cast_fp16))[name = tensor("op_11548_cast_fp16")]; + tensor var_11549_to_fp16 = const()[name = tensor("op_11549_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_761_cast_fp16 = mul(x = var_11548_cast_fp16, y = var_11549_to_fp16)[name = tensor("aw_761_cast_fp16")]; + tensor var_11552_equation_0 = const()[name = tensor("op_11552_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11552_cast_fp16 = einsum(equation = var_11552_equation_0, values = (var_11514_cast_fp16, var_11491_cast_fp16))[name = tensor("op_11552_cast_fp16")]; + tensor var_11553_to_fp16 = const()[name = tensor("op_11553_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_763_cast_fp16 = mul(x = var_11552_cast_fp16, y = var_11553_to_fp16)[name = tensor("aw_763_cast_fp16")]; + tensor var_11556_equation_0 = const()[name = tensor("op_11556_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11556_cast_fp16 = einsum(equation = var_11556_equation_0, values = (var_11518_cast_fp16, var_11495_cast_fp16))[name = tensor("op_11556_cast_fp16")]; + tensor var_11557_to_fp16 = const()[name = tensor("op_11557_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_765_cast_fp16 = mul(x = var_11556_cast_fp16, y = var_11557_to_fp16)[name = tensor("aw_765_cast_fp16")]; + tensor var_11560_equation_0 = const()[name = tensor("op_11560_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11560_cast_fp16 = einsum(equation = var_11560_equation_0, values = (var_11522_cast_fp16, var_11499_cast_fp16))[name = tensor("op_11560_cast_fp16")]; + tensor var_11561_to_fp16 = const()[name = tensor("op_11561_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_767_cast_fp16 = mul(x = var_11560_cast_fp16, y = var_11561_to_fp16)[name = tensor("aw_767_cast_fp16")]; + tensor var_11564_equation_0 = const()[name = tensor("op_11564_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11564_cast_fp16 = einsum(equation = var_11564_equation_0, values = (var_11526_cast_fp16, var_11503_cast_fp16))[name = tensor("op_11564_cast_fp16")]; + tensor var_11565_to_fp16 = const()[name = tensor("op_11565_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_769_cast_fp16 = mul(x = var_11564_cast_fp16, y = var_11565_to_fp16)[name = tensor("aw_769_cast_fp16")]; + tensor var_11567_cast_fp16 = softmax(axis = var_10509, x = aw_761_cast_fp16)[name = tensor("op_11567_cast_fp16")]; + tensor var_11568_cast_fp16 = softmax(axis = var_10509, x = aw_763_cast_fp16)[name = tensor("op_11568_cast_fp16")]; + tensor var_11569_cast_fp16 = softmax(axis = var_10509, x = aw_765_cast_fp16)[name = tensor("op_11569_cast_fp16")]; + tensor var_11570_cast_fp16 = softmax(axis = var_10509, x = aw_767_cast_fp16)[name = tensor("op_11570_cast_fp16")]; + tensor var_11571_cast_fp16 = softmax(axis = var_10509, x = aw_769_cast_fp16)[name = tensor("op_11571_cast_fp16")]; + tensor var_11573_equation_0 = const()[name = tensor("op_11573_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11573_cast_fp16 = einsum(equation = var_11573_equation_0, values = (var_11528_cast_fp16, var_11567_cast_fp16))[name = tensor("op_11573_cast_fp16")]; + tensor var_11575_equation_0 = const()[name = tensor("op_11575_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11575_cast_fp16 = einsum(equation = var_11575_equation_0, values = (var_11532_cast_fp16, var_11568_cast_fp16))[name = tensor("op_11575_cast_fp16")]; + tensor var_11577_equation_0 = const()[name = tensor("op_11577_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11577_cast_fp16 = einsum(equation = var_11577_equation_0, values = (var_11536_cast_fp16, var_11569_cast_fp16))[name = tensor("op_11577_cast_fp16")]; + tensor var_11579_equation_0 = const()[name = tensor("op_11579_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11579_cast_fp16 = einsum(equation = var_11579_equation_0, values = (var_11540_cast_fp16, var_11570_cast_fp16))[name = tensor("op_11579_cast_fp16")]; + tensor var_11581_equation_0 = const()[name = tensor("op_11581_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11581_cast_fp16 = einsum(equation = var_11581_equation_0, values = (var_11544_cast_fp16, var_11571_cast_fp16))[name = tensor("op_11581_cast_fp16")]; + tensor input_517_interleave_0 = const()[name = tensor("input_517_interleave_0"), val = tensor(false)]; + tensor input_517_cast_fp16 = concat(axis = var_10509, interleave = input_517_interleave_0, values = (var_11573_cast_fp16, var_11575_cast_fp16, var_11577_cast_fp16, var_11579_cast_fp16, var_11581_cast_fp16))[name = tensor("input_517_cast_fp16")]; + tensor var_11587 = const()[name = tensor("op_11587"), val = tensor([1, 1])]; + tensor var_11589 = const()[name = tensor("op_11589"), val = tensor([1, 1])]; + tensor var_11591_pad_type_0 = const()[name = tensor("op_11591_pad_type_0"), val = tensor("custom")]; + tensor var_11591_pad_0 = const()[name = tensor("op_11591_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1727273856)))]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1727478720)))]; + tensor var_11591_cast_fp16 = conv(bias = up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_11589, groups = var_10509, pad = var_11591_pad_0, pad_type = var_11591_pad_type_0, strides = var_11587, weight = up_blocks_3_attentions_2_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_517_cast_fp16)[name = tensor("op_11591_cast_fp16")]; + tensor inputs_93_cast_fp16 = add(x = var_11591_cast_fp16, y = inputs_91_cast_fp16)[name = tensor("inputs_93_cast_fp16")]; + tensor var_11595 = const()[name = tensor("op_11595"), val = tensor([1])]; + tensor channels_mean_93_cast_fp16 = reduce_mean(axes = var_11595, keep_dims = var_10504, x = inputs_93_cast_fp16)[name = tensor("channels_mean_93_cast_fp16")]; + tensor zero_mean_93_cast_fp16 = sub(x = inputs_93_cast_fp16, y = channels_mean_93_cast_fp16)[name = tensor("zero_mean_93_cast_fp16")]; + tensor zero_mean_sq_93_cast_fp16 = mul(x = zero_mean_93_cast_fp16, y = zero_mean_93_cast_fp16)[name = tensor("zero_mean_sq_93_cast_fp16")]; + tensor var_11599 = const()[name = tensor("op_11599"), val = tensor([1])]; + tensor var_11600_cast_fp16 = reduce_mean(axes = var_11599, keep_dims = var_10504, x = zero_mean_sq_93_cast_fp16)[name = tensor("op_11600_cast_fp16")]; + tensor var_11601_to_fp16 = const()[name = tensor("op_11601_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_11602_cast_fp16 = add(x = var_11600_cast_fp16, y = var_11601_to_fp16)[name = tensor("op_11602_cast_fp16")]; + tensor denom_93_epsilon_0_to_fp16 = const()[name = tensor("denom_93_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_93_cast_fp16 = rsqrt(epsilon = denom_93_epsilon_0_to_fp16, x = var_11602_cast_fp16)[name = tensor("denom_93_cast_fp16")]; + tensor out_93_cast_fp16 = mul(x = zero_mean_93_cast_fp16, y = denom_93_cast_fp16)[name = tensor("out_93_cast_fp16")]; + tensor var_11606_to_fp16 = const()[name = tensor("op_11606_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1727479424)))]; + tensor var_11607_cast_fp16 = add(x = out_93_cast_fp16, y = var_11606_to_fp16)[name = tensor("op_11607_cast_fp16")]; + tensor var_11609_to_fp16 = const()[name = tensor("op_11609_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1727480128)))]; + tensor hidden_states_329_cast_fp16 = mul(x = var_11607_cast_fp16, y = var_11609_to_fp16)[name = tensor("hidden_states_329_cast_fp16")]; + tensor var_11616 = const()[name = tensor("op_11616"), val = tensor([1, 1])]; + tensor var_11618 = const()[name = tensor("op_11618"), val = tensor([1, 1])]; + tensor q_pad_type_0 = const()[name = tensor("q_pad_type_0"), val = tensor("custom")]; + tensor q_pad_0 = const()[name = tensor("q_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1727480832)))]; + tensor q_cast_fp16 = conv(dilations = var_11618, groups = var_10509, pad = q_pad_0, pad_type = q_pad_type_0, strides = var_11616, weight = up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_329_cast_fp16)[name = tensor("q_cast_fp16")]; + tensor var_11622 = const()[name = tensor("op_11622"), val = tensor([1, 1])]; + tensor var_11624 = const()[name = tensor("op_11624"), val = tensor([1, 1])]; + tensor k_125_pad_type_0 = const()[name = tensor("k_125_pad_type_0"), val = tensor("custom")]; + tensor k_125_pad_0 = const()[name = tensor("k_125_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1727685696)))]; + tensor k_125_cast_fp16 = conv(dilations = var_11624, groups = var_10509, pad = k_125_pad_0, pad_type = k_125_pad_type_0, strides = var_11622, weight = up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_125_cast_fp16")]; + tensor var_11628 = const()[name = tensor("op_11628"), val = tensor([1, 1])]; + tensor var_11630 = const()[name = tensor("op_11630"), val = tensor([1, 1])]; + tensor v_pad_type_0 = const()[name = tensor("v_pad_type_0"), val = tensor("custom")]; + tensor v_pad_0 = const()[name = tensor("v_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1728341120)))]; + tensor v_cast_fp16 = conv(dilations = var_11630, groups = var_10509, pad = v_pad_0, pad_type = v_pad_type_0, strides = var_11628, weight = up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_cast_fp16")]; + tensor var_11634_begin_0 = const()[name = tensor("op_11634_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11634_end_0 = const()[name = tensor("op_11634_end_0"), val = tensor([2, 64, 1, 2304])]; + tensor var_11634_end_mask_0 = const()[name = tensor("op_11634_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11634_cast_fp16 = slice_by_index(begin = var_11634_begin_0, end = var_11634_end_0, end_mask = var_11634_end_mask_0, x = q_cast_fp16)[name = tensor("op_11634_cast_fp16")]; + tensor var_11638_begin_0 = const()[name = tensor("op_11638_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_11638_end_0 = const()[name = tensor("op_11638_end_0"), val = tensor([2, 128, 1, 2304])]; + tensor var_11638_end_mask_0 = const()[name = tensor("op_11638_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11638_cast_fp16 = slice_by_index(begin = var_11638_begin_0, end = var_11638_end_0, end_mask = var_11638_end_mask_0, x = q_cast_fp16)[name = tensor("op_11638_cast_fp16")]; + tensor var_11642_begin_0 = const()[name = tensor("op_11642_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_11642_end_0 = const()[name = tensor("op_11642_end_0"), val = tensor([2, 192, 1, 2304])]; + tensor var_11642_end_mask_0 = const()[name = tensor("op_11642_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11642_cast_fp16 = slice_by_index(begin = var_11642_begin_0, end = var_11642_end_0, end_mask = var_11642_end_mask_0, x = q_cast_fp16)[name = tensor("op_11642_cast_fp16")]; + tensor var_11646_begin_0 = const()[name = tensor("op_11646_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_11646_end_0 = const()[name = tensor("op_11646_end_0"), val = tensor([2, 256, 1, 2304])]; + tensor var_11646_end_mask_0 = const()[name = tensor("op_11646_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11646_cast_fp16 = slice_by_index(begin = var_11646_begin_0, end = var_11646_end_0, end_mask = var_11646_end_mask_0, x = q_cast_fp16)[name = tensor("op_11646_cast_fp16")]; + tensor var_11650_begin_0 = const()[name = tensor("op_11650_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_11650_end_0 = const()[name = tensor("op_11650_end_0"), val = tensor([2, 320, 1, 2304])]; + tensor var_11650_end_mask_0 = const()[name = tensor("op_11650_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11650_cast_fp16 = slice_by_index(begin = var_11650_begin_0, end = var_11650_end_0, end_mask = var_11650_end_mask_0, x = q_cast_fp16)[name = tensor("op_11650_cast_fp16")]; + tensor k_perm_0 = const()[name = tensor("k_perm_0"), val = tensor([0, 3, 2, 1])]; + tensor var_11657_begin_0 = const()[name = tensor("op_11657_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11657_end_0 = const()[name = tensor("op_11657_end_0"), val = tensor([2, 77, 1, 64])]; + tensor var_11657_end_mask_0 = const()[name = tensor("op_11657_end_mask_0"), val = tensor([true, true, true, false])]; + tensor transpose_0 = transpose(perm = k_perm_0, x = k_125_cast_fp16)[name = tensor("transpose_0")]; + tensor var_11657_cast_fp16 = slice_by_index(begin = var_11657_begin_0, end = var_11657_end_0, end_mask = var_11657_end_mask_0, x = transpose_0)[name = tensor("op_11657_cast_fp16")]; + tensor var_11661_begin_0 = const()[name = tensor("op_11661_begin_0"), val = tensor([0, 0, 0, 64])]; + tensor var_11661_end_0 = const()[name = tensor("op_11661_end_0"), val = tensor([2, 77, 1, 128])]; + tensor var_11661_end_mask_0 = const()[name = tensor("op_11661_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11661_cast_fp16 = slice_by_index(begin = var_11661_begin_0, end = var_11661_end_0, end_mask = var_11661_end_mask_0, x = transpose_0)[name = tensor("op_11661_cast_fp16")]; + tensor var_11665_begin_0 = const()[name = tensor("op_11665_begin_0"), val = tensor([0, 0, 0, 128])]; + tensor var_11665_end_0 = const()[name = tensor("op_11665_end_0"), val = tensor([2, 77, 1, 192])]; + tensor var_11665_end_mask_0 = const()[name = tensor("op_11665_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11665_cast_fp16 = slice_by_index(begin = var_11665_begin_0, end = var_11665_end_0, end_mask = var_11665_end_mask_0, x = transpose_0)[name = tensor("op_11665_cast_fp16")]; + tensor var_11669_begin_0 = const()[name = tensor("op_11669_begin_0"), val = tensor([0, 0, 0, 192])]; + tensor var_11669_end_0 = const()[name = tensor("op_11669_end_0"), val = tensor([2, 77, 1, 256])]; + tensor var_11669_end_mask_0 = const()[name = tensor("op_11669_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11669_cast_fp16 = slice_by_index(begin = var_11669_begin_0, end = var_11669_end_0, end_mask = var_11669_end_mask_0, x = transpose_0)[name = tensor("op_11669_cast_fp16")]; + tensor var_11673_begin_0 = const()[name = tensor("op_11673_begin_0"), val = tensor([0, 0, 0, 256])]; + tensor var_11673_end_0 = const()[name = tensor("op_11673_end_0"), val = tensor([2, 77, 1, 320])]; + tensor var_11673_end_mask_0 = const()[name = tensor("op_11673_end_mask_0"), val = tensor([true, true, true, false])]; + tensor var_11673_cast_fp16 = slice_by_index(begin = var_11673_begin_0, end = var_11673_end_0, end_mask = var_11673_end_mask_0, x = transpose_0)[name = tensor("op_11673_cast_fp16")]; + tensor var_11675_begin_0 = const()[name = tensor("op_11675_begin_0"), val = tensor([0, 0, 0, 0])]; + tensor var_11675_end_0 = const()[name = tensor("op_11675_end_0"), val = tensor([2, 64, 1, 77])]; + tensor var_11675_end_mask_0 = const()[name = tensor("op_11675_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11675_cast_fp16 = slice_by_index(begin = var_11675_begin_0, end = var_11675_end_0, end_mask = var_11675_end_mask_0, x = v_cast_fp16)[name = tensor("op_11675_cast_fp16")]; + tensor var_11679_begin_0 = const()[name = tensor("op_11679_begin_0"), val = tensor([0, 64, 0, 0])]; + tensor var_11679_end_0 = const()[name = tensor("op_11679_end_0"), val = tensor([2, 128, 1, 77])]; + tensor var_11679_end_mask_0 = const()[name = tensor("op_11679_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11679_cast_fp16 = slice_by_index(begin = var_11679_begin_0, end = var_11679_end_0, end_mask = var_11679_end_mask_0, x = v_cast_fp16)[name = tensor("op_11679_cast_fp16")]; + tensor var_11683_begin_0 = const()[name = tensor("op_11683_begin_0"), val = tensor([0, 128, 0, 0])]; + tensor var_11683_end_0 = const()[name = tensor("op_11683_end_0"), val = tensor([2, 192, 1, 77])]; + tensor var_11683_end_mask_0 = const()[name = tensor("op_11683_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11683_cast_fp16 = slice_by_index(begin = var_11683_begin_0, end = var_11683_end_0, end_mask = var_11683_end_mask_0, x = v_cast_fp16)[name = tensor("op_11683_cast_fp16")]; + tensor var_11687_begin_0 = const()[name = tensor("op_11687_begin_0"), val = tensor([0, 192, 0, 0])]; + tensor var_11687_end_0 = const()[name = tensor("op_11687_end_0"), val = tensor([2, 256, 1, 77])]; + tensor var_11687_end_mask_0 = const()[name = tensor("op_11687_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11687_cast_fp16 = slice_by_index(begin = var_11687_begin_0, end = var_11687_end_0, end_mask = var_11687_end_mask_0, x = v_cast_fp16)[name = tensor("op_11687_cast_fp16")]; + tensor var_11691_begin_0 = const()[name = tensor("op_11691_begin_0"), val = tensor([0, 256, 0, 0])]; + tensor var_11691_end_0 = const()[name = tensor("op_11691_end_0"), val = tensor([2, 320, 1, 77])]; + tensor var_11691_end_mask_0 = const()[name = tensor("op_11691_end_mask_0"), val = tensor([true, false, true, true])]; + tensor var_11691_cast_fp16 = slice_by_index(begin = var_11691_begin_0, end = var_11691_end_0, end_mask = var_11691_end_mask_0, x = v_cast_fp16)[name = tensor("op_11691_cast_fp16")]; + tensor var_11695_equation_0 = const()[name = tensor("op_11695_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11695_cast_fp16 = einsum(equation = var_11695_equation_0, values = (var_11657_cast_fp16, var_11634_cast_fp16))[name = tensor("op_11695_cast_fp16")]; + tensor var_11696_to_fp16 = const()[name = tensor("op_11696_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_771_cast_fp16 = mul(x = var_11695_cast_fp16, y = var_11696_to_fp16)[name = tensor("aw_771_cast_fp16")]; + tensor var_11699_equation_0 = const()[name = tensor("op_11699_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11699_cast_fp16 = einsum(equation = var_11699_equation_0, values = (var_11661_cast_fp16, var_11638_cast_fp16))[name = tensor("op_11699_cast_fp16")]; + tensor var_11700_to_fp16 = const()[name = tensor("op_11700_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_773_cast_fp16 = mul(x = var_11699_cast_fp16, y = var_11700_to_fp16)[name = tensor("aw_773_cast_fp16")]; + tensor var_11703_equation_0 = const()[name = tensor("op_11703_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11703_cast_fp16 = einsum(equation = var_11703_equation_0, values = (var_11665_cast_fp16, var_11642_cast_fp16))[name = tensor("op_11703_cast_fp16")]; + tensor var_11704_to_fp16 = const()[name = tensor("op_11704_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_775_cast_fp16 = mul(x = var_11703_cast_fp16, y = var_11704_to_fp16)[name = tensor("aw_775_cast_fp16")]; + tensor var_11707_equation_0 = const()[name = tensor("op_11707_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11707_cast_fp16 = einsum(equation = var_11707_equation_0, values = (var_11669_cast_fp16, var_11646_cast_fp16))[name = tensor("op_11707_cast_fp16")]; + tensor var_11708_to_fp16 = const()[name = tensor("op_11708_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_777_cast_fp16 = mul(x = var_11707_cast_fp16, y = var_11708_to_fp16)[name = tensor("aw_777_cast_fp16")]; + tensor var_11711_equation_0 = const()[name = tensor("op_11711_equation_0"), val = tensor("bkhc,bchq->bkhq")]; + tensor var_11711_cast_fp16 = einsum(equation = var_11711_equation_0, values = (var_11673_cast_fp16, var_11650_cast_fp16))[name = tensor("op_11711_cast_fp16")]; + tensor var_11712_to_fp16 = const()[name = tensor("op_11712_to_fp16"), val = tensor(0x1p-3)]; + tensor aw_cast_fp16 = mul(x = var_11711_cast_fp16, y = var_11712_to_fp16)[name = tensor("aw_cast_fp16")]; + tensor var_11714_cast_fp16 = softmax(axis = var_10509, x = aw_771_cast_fp16)[name = tensor("op_11714_cast_fp16")]; + tensor var_11715_cast_fp16 = softmax(axis = var_10509, x = aw_773_cast_fp16)[name = tensor("op_11715_cast_fp16")]; + tensor var_11716_cast_fp16 = softmax(axis = var_10509, x = aw_775_cast_fp16)[name = tensor("op_11716_cast_fp16")]; + tensor var_11717_cast_fp16 = softmax(axis = var_10509, x = aw_777_cast_fp16)[name = tensor("op_11717_cast_fp16")]; + tensor var_11718_cast_fp16 = softmax(axis = var_10509, x = aw_cast_fp16)[name = tensor("op_11718_cast_fp16")]; + tensor var_11720_equation_0 = const()[name = tensor("op_11720_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11720_cast_fp16 = einsum(equation = var_11720_equation_0, values = (var_11675_cast_fp16, var_11714_cast_fp16))[name = tensor("op_11720_cast_fp16")]; + tensor var_11722_equation_0 = const()[name = tensor("op_11722_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11722_cast_fp16 = einsum(equation = var_11722_equation_0, values = (var_11679_cast_fp16, var_11715_cast_fp16))[name = tensor("op_11722_cast_fp16")]; + tensor var_11724_equation_0 = const()[name = tensor("op_11724_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11724_cast_fp16 = einsum(equation = var_11724_equation_0, values = (var_11683_cast_fp16, var_11716_cast_fp16))[name = tensor("op_11724_cast_fp16")]; + tensor var_11726_equation_0 = const()[name = tensor("op_11726_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11726_cast_fp16 = einsum(equation = var_11726_equation_0, values = (var_11687_cast_fp16, var_11717_cast_fp16))[name = tensor("op_11726_cast_fp16")]; + tensor var_11728_equation_0 = const()[name = tensor("op_11728_equation_0"), val = tensor("bchk,bkhq->bchq")]; + tensor var_11728_cast_fp16 = einsum(equation = var_11728_equation_0, values = (var_11691_cast_fp16, var_11718_cast_fp16))[name = tensor("op_11728_cast_fp16")]; + tensor input_519_interleave_0 = const()[name = tensor("input_519_interleave_0"), val = tensor(false)]; + tensor input_519_cast_fp16 = concat(axis = var_10509, interleave = input_519_interleave_0, values = (var_11720_cast_fp16, var_11722_cast_fp16, var_11724_cast_fp16, var_11726_cast_fp16, var_11728_cast_fp16))[name = tensor("input_519_cast_fp16")]; + tensor var_11734 = const()[name = tensor("op_11734"), val = tensor([1, 1])]; + tensor var_11736 = const()[name = tensor("op_11736"), val = tensor([1, 1])]; + tensor var_11738_pad_type_0 = const()[name = tensor("op_11738_pad_type_0"), val = tensor("custom")]; + tensor var_11738_pad_0 = const()[name = tensor("op_11738_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1728996544)))]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1729201408)))]; + tensor var_11738_cast_fp16 = conv(bias = up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_11736, groups = var_10509, pad = var_11738_pad_0, pad_type = var_11738_pad_type_0, strides = var_11734, weight = up_blocks_3_attentions_2_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_519_cast_fp16)[name = tensor("op_11738_cast_fp16")]; + tensor inputs_cast_fp16 = add(x = var_11738_cast_fp16, y = inputs_93_cast_fp16)[name = tensor("inputs_cast_fp16")]; + tensor var_11742 = const()[name = tensor("op_11742"), val = tensor([1])]; + tensor channels_mean_cast_fp16 = reduce_mean(axes = var_11742, keep_dims = var_10504, x = inputs_cast_fp16)[name = tensor("channels_mean_cast_fp16")]; + tensor zero_mean_cast_fp16 = sub(x = inputs_cast_fp16, y = channels_mean_cast_fp16)[name = tensor("zero_mean_cast_fp16")]; + tensor zero_mean_sq_cast_fp16 = mul(x = zero_mean_cast_fp16, y = zero_mean_cast_fp16)[name = tensor("zero_mean_sq_cast_fp16")]; + tensor var_11746 = const()[name = tensor("op_11746"), val = tensor([1])]; + tensor var_11747_cast_fp16 = reduce_mean(axes = var_11746, keep_dims = var_10504, x = zero_mean_sq_cast_fp16)[name = tensor("op_11747_cast_fp16")]; + tensor var_11748_to_fp16 = const()[name = tensor("op_11748_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_11749_cast_fp16 = add(x = var_11747_cast_fp16, y = var_11748_to_fp16)[name = tensor("op_11749_cast_fp16")]; + tensor denom_epsilon_0_to_fp16 = const()[name = tensor("denom_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; + tensor denom_cast_fp16 = rsqrt(epsilon = denom_epsilon_0_to_fp16, x = var_11749_cast_fp16)[name = tensor("denom_cast_fp16")]; + tensor out_cast_fp16 = mul(x = zero_mean_cast_fp16, y = denom_cast_fp16)[name = tensor("out_cast_fp16")]; + tensor var_11753_to_fp16 = const()[name = tensor("op_11753_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1729202112)))]; + tensor var_11754_cast_fp16 = add(x = out_cast_fp16, y = var_11753_to_fp16)[name = tensor("op_11754_cast_fp16")]; + tensor var_11756_to_fp16 = const()[name = tensor("op_11756_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1729202816)))]; + tensor input_521_cast_fp16 = mul(x = var_11754_cast_fp16, y = var_11756_to_fp16)[name = tensor("input_521_cast_fp16")]; + tensor var_11764 = const()[name = tensor("op_11764"), val = tensor([1, 1])]; + tensor var_11766 = const()[name = tensor("op_11766"), val = tensor([1, 1])]; + tensor var_11768_pad_type_0 = const()[name = tensor("op_11768_pad_type_0"), val = tensor("custom")]; + tensor var_11768_pad_0 = const()[name = tensor("op_11768_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1729203520)))]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1730841984)))]; + tensor var_11768_cast_fp16 = conv(bias = up_blocks_3_attentions_2_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_11766, groups = var_10509, pad = var_11768_pad_0, pad_type = var_11768_pad_type_0, strides = var_11764, weight = up_blocks_3_attentions_2_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_521_cast_fp16)[name = tensor("op_11768_cast_fp16")]; + tensor var_11769_split_sizes_0 = const()[name = tensor("op_11769_split_sizes_0"), val = tensor([1280, 1280])]; + tensor var_11769_axis_0 = const()[name = tensor("op_11769_axis_0"), val = tensor(1)]; + tensor var_11769_cast_fp16_0, tensor var_11769_cast_fp16_1 = split(axis = var_11769_axis_0, split_sizes = var_11769_split_sizes_0, x = var_11768_cast_fp16)[name = tensor("op_11769_cast_fp16")]; + tensor var_11771_mode_0 = const()[name = tensor("op_11771_mode_0"), val = tensor("EXACT")]; + tensor var_11771_cast_fp16 = gelu(mode = var_11771_mode_0, x = var_11769_cast_fp16_1)[name = tensor("op_11771_cast_fp16")]; + tensor input_523_cast_fp16 = mul(x = var_11769_cast_fp16_0, y = var_11771_cast_fp16)[name = tensor("input_523_cast_fp16")]; + tensor var_11775 = const()[name = tensor("op_11775"), val = tensor([1, 1])]; + tensor var_11777 = const()[name = tensor("op_11777"), val = tensor([1, 1])]; + tensor var_11779_pad_type_0 = const()[name = tensor("op_11779_pad_type_0"), val = tensor("custom")]; + tensor var_11779_pad_0 = const()[name = tensor("op_11779_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1730847168)))]; + tensor up_blocks_3_attentions_2_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1731666432)))]; + tensor var_11779_cast_fp16 = conv(bias = up_blocks_3_attentions_2_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_11777, groups = var_10509, pad = var_11779_pad_0, pad_type = var_11779_pad_type_0, strides = var_11775, weight = up_blocks_3_attentions_2_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_523_cast_fp16)[name = tensor("op_11779_cast_fp16")]; + tensor hidden_states_333_cast_fp16 = add(x = var_11779_cast_fp16, y = inputs_cast_fp16)[name = tensor("hidden_states_333_cast_fp16")]; + tensor var_11781 = const()[name = tensor("op_11781"), val = tensor([2, 320, 48, 48])]; + tensor input_525_cast_fp16 = reshape(shape = var_11781, x = hidden_states_333_cast_fp16)[name = tensor("input_525_cast_fp16")]; + tensor var_11785 = const()[name = tensor("op_11785"), val = tensor([1, 1])]; + tensor var_11787 = const()[name = tensor("op_11787"), val = tensor([1, 1])]; + tensor hidden_states_pad_type_0 = const()[name = tensor("hidden_states_pad_type_0"), val = tensor("custom")]; + tensor hidden_states_pad_0 = const()[name = tensor("hidden_states_pad_0"), val = tensor([0, 0, 0, 0])]; + tensor up_blocks_3_attentions_2_proj_out_weight_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1731667136)))]; + tensor up_blocks_3_attentions_2_proj_out_bias_to_fp16 = const()[name = tensor("up_blocks_3_attentions_2_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1731872000)))]; + tensor hidden_states_cast_fp16 = conv(bias = up_blocks_3_attentions_2_proj_out_bias_to_fp16, dilations = var_11787, groups = var_10509, pad = hidden_states_pad_0, pad_type = hidden_states_pad_type_0, strides = var_11785, weight = up_blocks_3_attentions_2_proj_out_weight_to_fp16, x = input_525_cast_fp16)[name = tensor("hidden_states_cast_fp16")]; + tensor input_527_cast_fp16 = add(x = hidden_states_cast_fp16, y = hidden_states_323_cast_fp16)[name = tensor("input_527_cast_fp16")]; + tensor reshape_240_shape_0 = const()[name = tensor("reshape_240_shape_0"), val = tensor([2, 32, 10, 48, 48])]; + tensor reshape_240_cast_fp16 = reshape(shape = reshape_240_shape_0, x = input_527_cast_fp16)[name = tensor("reshape_240_cast_fp16")]; + tensor reduce_mean_180_axes_0 = const()[name = tensor("reduce_mean_180_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_180_keep_dims_0 = const()[name = tensor("reduce_mean_180_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_180_cast_fp16 = reduce_mean(axes = reduce_mean_180_axes_0, keep_dims = reduce_mean_180_keep_dims_0, x = reshape_240_cast_fp16)[name = tensor("reduce_mean_180_cast_fp16")]; + tensor sub_120_cast_fp16 = sub(x = reshape_240_cast_fp16, y = reduce_mean_180_cast_fp16)[name = tensor("sub_120_cast_fp16")]; + tensor square_60_cast_fp16 = square(x = sub_120_cast_fp16)[name = tensor("square_60_cast_fp16")]; + tensor reduce_mean_182_axes_0 = const()[name = tensor("reduce_mean_182_axes_0"), val = tensor([2, 3, 4])]; + tensor reduce_mean_182_keep_dims_0 = const()[name = tensor("reduce_mean_182_keep_dims_0"), val = tensor(true)]; + tensor reduce_mean_182_cast_fp16 = reduce_mean(axes = reduce_mean_182_axes_0, keep_dims = reduce_mean_182_keep_dims_0, x = square_60_cast_fp16)[name = tensor("reduce_mean_182_cast_fp16")]; + tensor add_120_y_0_to_fp16 = const()[name = tensor("add_120_y_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_120_cast_fp16 = add(x = reduce_mean_182_cast_fp16, y = add_120_y_0_to_fp16)[name = tensor("add_120_cast_fp16")]; + tensor sqrt_60_cast_fp16 = sqrt(x = add_120_cast_fp16)[name = tensor("sqrt_60_cast_fp16")]; + tensor real_div_60_cast_fp16 = real_div(x = sub_120_cast_fp16, y = sqrt_60_cast_fp16)[name = tensor("real_div_60_cast_fp16")]; + tensor reshape_241_shape_0 = const()[name = tensor("reshape_241_shape_0"), val = tensor([2, 320, 48, 48])]; + tensor reshape_241_cast_fp16 = reshape(shape = reshape_241_shape_0, x = real_div_60_cast_fp16)[name = tensor("reshape_241_cast_fp16")]; + tensor add_121_gamma_0_to_fp16 = const()[name = tensor("add_121_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1731872704)))]; + tensor add_121_beta_0_to_fp16 = const()[name = tensor("add_121_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1731873408)))]; + tensor add_121_epsilon_0_to_fp16 = const()[name = tensor("add_121_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; + tensor add_121_cast_fp16 = batch_norm(beta = add_121_beta_0_to_fp16, epsilon = add_121_epsilon_0_to_fp16, gamma = add_121_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_241_cast_fp16)[name = tensor("add_121_cast_fp16")]; + tensor input_cast_fp16 = silu(x = add_121_cast_fp16)[name = tensor("input_cast_fp16")]; + tensor var_11801 = const()[name = tensor("op_11801"), val = tensor(1)]; + tensor var_11804 = const()[name = tensor("op_11804"), val = tensor([1, 1])]; + tensor var_11806 = const()[name = tensor("op_11806"), val = tensor([1, 1])]; + tensor var_11808_pad_type_0 = const()[name = tensor("op_11808_pad_type_0"), val = tensor("custom")]; + tensor var_11808_pad_0 = const()[name = tensor("op_11808_pad_0"), val = tensor([1, 1, 1, 1])]; + tensor conv_out_weight_to_fp16 = const()[name = tensor("conv_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1731874112)))]; + tensor conv_out_bias_to_fp16 = const()[name = tensor("conv_out_bias_to_fp16"), val = tensor([-0x1.4b4p-9, 0x1.6f4p-9, 0x1.9ap-12, 0x1.04p-9])]; + tensor var_11808_cast_fp16 = conv(bias = conv_out_bias_to_fp16, dilations = var_11806, groups = var_11801, pad = var_11808_pad_0, pad_type = var_11808_pad_type_0, strides = var_11804, weight = conv_out_weight_to_fp16, x = input_cast_fp16)[name = tensor("op_11808_cast_fp16")]; + tensor var_11808_cast_fp16_to_fp32_dtype_0 = const()[name = tensor("op_11808_cast_fp16_to_fp32_dtype_0"), val = tensor("fp32")]; + tensor noise_pred = cast(dtype = var_11808_cast_fp16_to_fp32_dtype_0, x = var_11808_cast_fp16)[name = tensor("cast_133")]; + } -> (noise_pred); +} \ No newline at end of file