program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "5.33.5"}, {"coremlc-version", "1877.40.3"}, {"coremltools-component-milinternal", ""}, {"coremltools-version", "7.1"}})] { func main(tensor encoder_hidden_states, tensor sample, tensor timestep) { tensor var_25 = const()[name = tensor("op_25"), val = tensor(-1)]; tensor var_42_axes_0 = const()[name = tensor("op_42_axes_0"), val = tensor([1])]; tensor var_42_cast_fp16 = expand_dims(axes = var_42_axes_0, x = timestep)[name = tensor("op_42_cast_fp16")]; tensor var_44_to_fp16 = const()[name = tensor("op_44_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor emb_3_cast_fp16 = mul(x = var_42_cast_fp16, y = var_44_to_fp16)[name = tensor("emb_3_cast_fp16")]; tensor var_49_cast_fp16 = sin(x = emb_3_cast_fp16)[name = tensor("op_49_cast_fp16")]; tensor var_50_cast_fp16 = cos(x = emb_3_cast_fp16)[name = tensor("op_50_cast_fp16")]; tensor emb_interleave_0 = const()[name = tensor("emb_interleave_0"), val = tensor(false)]; tensor emb_cast_fp16 = concat(axis = var_25, interleave = emb_interleave_0, values = (var_49_cast_fp16, var_50_cast_fp16))[name = tensor("emb_cast_fp16")]; tensor var_54_begin_0 = const()[name = tensor("op_54_begin_0"), val = tensor([0, 160])]; tensor var_54_end_0 = const()[name = tensor("op_54_end_0"), val = tensor([2, 320])]; tensor var_54_end_mask_0 = const()[name = tensor("op_54_end_mask_0"), val = tensor([true, true])]; tensor var_54_cast_fp16 = slice_by_index(begin = var_54_begin_0, end = var_54_end_0, end_mask = var_54_end_mask_0, x = emb_cast_fp16)[name = tensor("op_54_cast_fp16")]; tensor var_56_begin_0 = const()[name = tensor("op_56_begin_0"), val = tensor([0, 0])]; tensor var_56_end_0 = const()[name = tensor("op_56_end_0"), val = tensor([2, 160])]; tensor var_56_end_mask_0 = const()[name = tensor("op_56_end_mask_0"), val = tensor([true, false])]; tensor var_56_cast_fp16 = slice_by_index(begin = var_56_begin_0, end = var_56_end_0, end_mask = var_56_end_mask_0, x = emb_cast_fp16)[name = tensor("op_56_cast_fp16")]; tensor sample_interleave_0 = const()[name = tensor("sample_interleave_0"), val = tensor(false)]; tensor sample_cast_fp16 = concat(axis = var_25, interleave = sample_interleave_0, values = (var_54_cast_fp16, var_56_cast_fp16))[name = tensor("sample_cast_fp16")]; tensor var_59 = const()[name = tensor("op_59"), val = tensor(1)]; tensor var_66_axes_0 = const()[name = tensor("op_66_axes_0"), val = tensor([-1])]; tensor var_66_cast_fp16 = expand_dims(axes = var_66_axes_0, x = sample_cast_fp16)[name = tensor("op_66_cast_fp16")]; tensor input_1_axes_0 = const()[name = tensor("input_1_axes_0"), val = tensor([-1])]; tensor input_1_cast_fp16 = expand_dims(axes = input_1_axes_0, x = var_66_cast_fp16)[name = tensor("input_1_cast_fp16")]; tensor var_70 = const()[name = tensor("op_70"), val = tensor([1, 1])]; tensor var_72 = const()[name = tensor("op_72"), val = tensor([1, 1])]; tensor input_3_pad_type_0 = const()[name = tensor("input_3_pad_type_0"), val = tensor("custom")]; tensor input_3_pad_0 = const()[name = tensor("input_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor time_embedding_linear_1_weight_to_fp16 = const()[name = tensor("time_embedding_linear_1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(448)))]; tensor time_embedding_linear_1_bias_to_fp16 = const()[name = tensor("time_embedding_linear_1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(819712)))]; tensor input_3_cast_fp16 = conv(bias = time_embedding_linear_1_bias_to_fp16, dilations = var_72, groups = var_59, pad = input_3_pad_0, pad_type = input_3_pad_type_0, strides = var_70, weight = time_embedding_linear_1_weight_to_fp16, x = input_1_cast_fp16)[name = tensor("input_3_cast_fp16")]; tensor input_5_cast_fp16 = silu(x = input_3_cast_fp16)[name = tensor("input_5_cast_fp16")]; tensor var_78 = const()[name = tensor("op_78"), val = tensor([1, 1])]; tensor var_80 = const()[name = tensor("op_80"), val = tensor([1, 1])]; tensor input_13_pad_type_0 = const()[name = tensor("input_13_pad_type_0"), val = tensor("custom")]; tensor input_13_pad_0 = const()[name = tensor("input_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor time_embedding_linear_2_weight_to_fp16 = const()[name = tensor("time_embedding_linear_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(822336)))]; tensor time_embedding_linear_2_bias_to_fp16 = const()[name = tensor("time_embedding_linear_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4099200)))]; tensor input_13_cast_fp16 = conv(bias = time_embedding_linear_2_bias_to_fp16, dilations = var_80, groups = var_59, pad = input_13_pad_0, pad_type = input_13_pad_type_0, strides = var_78, weight = time_embedding_linear_2_weight_to_fp16, x = input_5_cast_fp16)[name = tensor("input_13_cast_fp16")]; tensor var_86 = const()[name = tensor("op_86"), val = tensor(1)]; tensor var_89 = const()[name = tensor("op_89"), val = tensor([1, 1])]; tensor var_91 = const()[name = tensor("op_91"), val = tensor([1, 1])]; tensor input_7_pad_type_0 = const()[name = tensor("input_7_pad_type_0"), val = tensor("custom")]; tensor input_7_pad_0 = const()[name = tensor("input_7_pad_0"), val = tensor([1, 1, 1, 1])]; tensor conv_in_weight_to_fp16 = const()[name = tensor("conv_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4101824)))]; tensor conv_in_bias_to_fp16 = const()[name = tensor("conv_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4124928)))]; tensor input_7_cast_fp16_1 = conv(bias = conv_in_bias_to_fp16, dilations = var_91, groups = var_86, pad = input_7_pad_0, pad_type = input_7_pad_type_0, strides = var_89, weight = conv_in_weight_to_fp16, x = sample)[name = tensor("input_7_cast_fp16")]; tensor var_107 = const()[name = tensor("op_107"), val = tensor(true)]; tensor var_112 = const()[name = tensor("op_112"), val = tensor(1)]; tensor reshape_0_shape_0 = const()[name = tensor("reshape_0_shape_0"), val = tensor([2, 32, 10, 48, 48])]; tensor reshape_0_cast_fp16 = reshape(shape = reshape_0_shape_0, x = input_7_cast_fp16_1)[name = tensor("reshape_0_cast_fp16")]; tensor reduce_mean_0_axes_0 = const()[name = tensor("reduce_mean_0_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_0_keep_dims_0 = const()[name = tensor("reduce_mean_0_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_0_cast_fp16 = reduce_mean(axes = reduce_mean_0_axes_0, keep_dims = reduce_mean_0_keep_dims_0, x = reshape_0_cast_fp16)[name = tensor("reduce_mean_0_cast_fp16")]; tensor sub_0_cast_fp16 = sub(x = reshape_0_cast_fp16, y = reduce_mean_0_cast_fp16)[name = tensor("sub_0_cast_fp16")]; tensor square_0_cast_fp16 = square(x = sub_0_cast_fp16)[name = tensor("square_0_cast_fp16")]; tensor reduce_mean_2_axes_0 = const()[name = tensor("reduce_mean_2_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_2_keep_dims_0 = const()[name = tensor("reduce_mean_2_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_2_cast_fp16 = reduce_mean(axes = reduce_mean_2_axes_0, keep_dims = reduce_mean_2_keep_dims_0, x = square_0_cast_fp16)[name = tensor("reduce_mean_2_cast_fp16")]; tensor add_0_y_0_to_fp16 = const()[name = tensor("add_0_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_0_cast_fp16 = add(x = reduce_mean_2_cast_fp16, y = add_0_y_0_to_fp16)[name = tensor("add_0_cast_fp16")]; tensor sqrt_0_cast_fp16 = sqrt(x = add_0_cast_fp16)[name = tensor("sqrt_0_cast_fp16")]; tensor real_div_0_cast_fp16 = real_div(x = sub_0_cast_fp16, y = sqrt_0_cast_fp16)[name = tensor("real_div_0_cast_fp16")]; tensor reshape_1_shape_0 = const()[name = tensor("reshape_1_shape_0"), val = tensor([2, 320, 48, 48])]; tensor reshape_1_cast_fp16 = reshape(shape = reshape_1_shape_0, x = real_div_0_cast_fp16)[name = tensor("reshape_1_cast_fp16")]; tensor add_1_mean_0_to_fp16 = const()[name = tensor("add_1_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4125632)))]; tensor add_1_variance_0_to_fp16 = const()[name = tensor("add_1_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4126336)))]; tensor add_1_gamma_0_to_fp16 = const()[name = tensor("add_1_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4127040)))]; tensor add_1_beta_0_to_fp16 = const()[name = tensor("add_1_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4127744)))]; tensor add_1_epsilon_0_to_fp16 = const()[name = tensor("add_1_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_1_cast_fp16 = batch_norm(beta = add_1_beta_0_to_fp16, epsilon = add_1_epsilon_0_to_fp16, gamma = add_1_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_1_cast_fp16)[name = tensor("add_1_cast_fp16")]; tensor input_11_cast_fp16 = silu(x = add_1_cast_fp16)[name = tensor("input_11_cast_fp16")]; tensor var_134 = const()[name = tensor("op_134"), val = tensor([1, 1])]; tensor var_136 = const()[name = tensor("op_136"), val = tensor([1, 1])]; tensor hidden_states_1_pad_type_0 = const()[name = tensor("hidden_states_1_pad_type_0"), val = tensor("custom")]; tensor hidden_states_1_pad_0 = const()[name = tensor("hidden_states_1_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_0_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4128448)))]; tensor down_blocks_0_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5971712)))]; tensor hidden_states_1_cast_fp16 = conv(bias = down_blocks_0_resnets_0_conv1_bias_to_fp16, dilations = var_136, groups = var_112, pad = hidden_states_1_pad_0, pad_type = hidden_states_1_pad_type_0, strides = var_134, weight = down_blocks_0_resnets_0_conv1_weight_to_fp16, x = input_11_cast_fp16)[name = tensor("hidden_states_1_cast_fp16")]; tensor input_15_cast_fp16_1 = silu(x = input_13_cast_fp16)[name = tensor("input_15_cast_fp16")]; tensor var_142 = const()[name = tensor("op_142"), val = tensor([1, 1])]; tensor var_144 = const()[name = tensor("op_144"), val = tensor([1, 1])]; tensor temb_1_pad_type_0 = const()[name = tensor("temb_1_pad_type_0"), val = tensor("custom")]; tensor temb_1_pad_0 = const()[name = tensor("temb_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5972416)))]; tensor down_blocks_0_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6791680)))]; tensor temb_1_cast_fp16 = conv(bias = down_blocks_0_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_144, groups = var_112, pad = temb_1_pad_0, pad_type = temb_1_pad_type_0, strides = var_142, weight = down_blocks_0_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_1_cast_fp16")]; tensor input_17_cast_fp16 = add(x = hidden_states_1_cast_fp16, y = temb_1_cast_fp16)[name = tensor("input_17_cast_fp16")]; tensor reshape_4_shape_0 = const()[name = tensor("reshape_4_shape_0"), val = tensor([2, 32, 10, 48, 48])]; tensor reshape_4_cast_fp16 = reshape(shape = reshape_4_shape_0, x = input_17_cast_fp16)[name = tensor("reshape_4_cast_fp16")]; tensor reduce_mean_3_axes_0 = const()[name = tensor("reduce_mean_3_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_3_keep_dims_0 = const()[name = tensor("reduce_mean_3_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_3_cast_fp16 = reduce_mean(axes = reduce_mean_3_axes_0, keep_dims = reduce_mean_3_keep_dims_0, x = reshape_4_cast_fp16)[name = tensor("reduce_mean_3_cast_fp16")]; tensor sub_2_cast_fp16 = sub(x = reshape_4_cast_fp16, y = reduce_mean_3_cast_fp16)[name = tensor("sub_2_cast_fp16")]; tensor square_1_cast_fp16 = square(x = sub_2_cast_fp16)[name = tensor("square_1_cast_fp16")]; tensor reduce_mean_5_axes_0 = const()[name = tensor("reduce_mean_5_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_5_keep_dims_0 = const()[name = tensor("reduce_mean_5_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_5_cast_fp16 = reduce_mean(axes = reduce_mean_5_axes_0, keep_dims = reduce_mean_5_keep_dims_0, x = square_1_cast_fp16)[name = tensor("reduce_mean_5_cast_fp16")]; tensor add_2_y_0_to_fp16 = const()[name = tensor("add_2_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_2_cast_fp16 = add(x = reduce_mean_5_cast_fp16, y = add_2_y_0_to_fp16)[name = tensor("add_2_cast_fp16")]; tensor sqrt_1_cast_fp16 = sqrt(x = add_2_cast_fp16)[name = tensor("sqrt_1_cast_fp16")]; tensor real_div_1_cast_fp16 = real_div(x = sub_2_cast_fp16, y = sqrt_1_cast_fp16)[name = tensor("real_div_1_cast_fp16")]; tensor reshape_5_shape_0 = const()[name = tensor("reshape_5_shape_0"), val = tensor([2, 320, 48, 48])]; tensor reshape_5_cast_fp16 = reshape(shape = reshape_5_shape_0, x = real_div_1_cast_fp16)[name = tensor("reshape_5_cast_fp16")]; tensor add_3_gamma_0_to_fp16 = const()[name = tensor("add_3_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6792384)))]; tensor add_3_beta_0_to_fp16 = const()[name = tensor("add_3_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6793088)))]; tensor add_3_epsilon_0_to_fp16 = const()[name = tensor("add_3_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_3_cast_fp16 = batch_norm(beta = add_3_beta_0_to_fp16, epsilon = add_3_epsilon_0_to_fp16, gamma = add_3_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_5_cast_fp16)[name = tensor("add_3_cast_fp16")]; tensor input_21_cast_fp16 = silu(x = add_3_cast_fp16)[name = tensor("input_21_cast_fp16")]; tensor var_154 = const()[name = tensor("op_154"), val = tensor([1, 1])]; tensor var_156 = const()[name = tensor("op_156"), val = tensor([1, 1])]; tensor hidden_states_3_pad_type_0 = const()[name = tensor("hidden_states_3_pad_type_0"), val = tensor("custom")]; tensor hidden_states_3_pad_0 = const()[name = tensor("hidden_states_3_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_0_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6793792)))]; tensor down_blocks_0_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8637056)))]; tensor hidden_states_3_cast_fp16 = conv(bias = down_blocks_0_resnets_0_conv2_bias_to_fp16, dilations = var_156, groups = var_112, pad = hidden_states_3_pad_0, pad_type = hidden_states_3_pad_type_0, strides = var_154, weight = down_blocks_0_resnets_0_conv2_weight_to_fp16, x = input_21_cast_fp16)[name = tensor("hidden_states_3_cast_fp16")]; tensor hidden_states_5_cast_fp16 = add(x = input_7_cast_fp16_1, y = hidden_states_3_cast_fp16)[name = tensor("hidden_states_5_cast_fp16")]; tensor reshape_8_shape_0 = const()[name = tensor("reshape_8_shape_0"), val = tensor([2, 32, 10, 48, 48])]; tensor reshape_8_cast_fp16 = reshape(shape = reshape_8_shape_0, x = hidden_states_5_cast_fp16)[name = tensor("reshape_8_cast_fp16")]; tensor reduce_mean_6_axes_0 = const()[name = tensor("reduce_mean_6_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_6_keep_dims_0 = const()[name = tensor("reduce_mean_6_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_6_cast_fp16 = reduce_mean(axes = reduce_mean_6_axes_0, keep_dims = reduce_mean_6_keep_dims_0, x = reshape_8_cast_fp16)[name = tensor("reduce_mean_6_cast_fp16")]; tensor sub_4_cast_fp16 = sub(x = reshape_8_cast_fp16, y = reduce_mean_6_cast_fp16)[name = tensor("sub_4_cast_fp16")]; tensor square_2_cast_fp16 = square(x = sub_4_cast_fp16)[name = tensor("square_2_cast_fp16")]; tensor reduce_mean_8_axes_0 = const()[name = tensor("reduce_mean_8_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_8_keep_dims_0 = const()[name = tensor("reduce_mean_8_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_8_cast_fp16 = reduce_mean(axes = reduce_mean_8_axes_0, keep_dims = reduce_mean_8_keep_dims_0, x = square_2_cast_fp16)[name = tensor("reduce_mean_8_cast_fp16")]; tensor add_4_y_0_to_fp16 = const()[name = tensor("add_4_y_0_to_fp16"), val = tensor(0x1.1p-20)]; tensor add_4_cast_fp16 = add(x = reduce_mean_8_cast_fp16, y = add_4_y_0_to_fp16)[name = tensor("add_4_cast_fp16")]; tensor sqrt_2_cast_fp16 = sqrt(x = add_4_cast_fp16)[name = tensor("sqrt_2_cast_fp16")]; tensor real_div_2_cast_fp16 = real_div(x = sub_4_cast_fp16, y = sqrt_2_cast_fp16)[name = tensor("real_div_2_cast_fp16")]; tensor reshape_9_shape_0 = const()[name = tensor("reshape_9_shape_0"), val = tensor([2, 320, 48, 48])]; tensor reshape_9_cast_fp16 = reshape(shape = reshape_9_shape_0, x = real_div_2_cast_fp16)[name = tensor("reshape_9_cast_fp16")]; tensor add_5_gamma_0_to_fp16 = const()[name = tensor("add_5_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8637760)))]; tensor add_5_beta_0_to_fp16 = const()[name = tensor("add_5_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8638464)))]; tensor add_5_epsilon_0_to_fp16 = const()[name = tensor("add_5_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_5_cast_fp16 = batch_norm(beta = add_5_beta_0_to_fp16, epsilon = add_5_epsilon_0_to_fp16, gamma = add_5_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_9_cast_fp16)[name = tensor("add_5_cast_fp16")]; tensor var_176 = const()[name = tensor("op_176"), val = tensor([1, 1])]; tensor var_178 = const()[name = tensor("op_178"), val = tensor([1, 1])]; tensor hidden_states_7_pad_type_0 = const()[name = tensor("hidden_states_7_pad_type_0"), val = tensor("custom")]; tensor hidden_states_7_pad_0 = const()[name = tensor("hidden_states_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8639168)))]; tensor down_blocks_0_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8844032)))]; tensor hidden_states_7_cast_fp16 = conv(bias = down_blocks_0_attentions_0_proj_in_bias_to_fp16, dilations = var_178, groups = var_112, pad = hidden_states_7_pad_0, pad_type = hidden_states_7_pad_type_0, strides = var_176, weight = down_blocks_0_attentions_0_proj_in_weight_to_fp16, x = add_5_cast_fp16)[name = tensor("hidden_states_7_cast_fp16")]; tensor var_183 = const()[name = tensor("op_183"), val = tensor([2, 320, 1, 2304])]; tensor inputs_1_cast_fp16 = reshape(shape = var_183, x = hidden_states_7_cast_fp16)[name = tensor("inputs_1_cast_fp16")]; tensor var_193 = const()[name = tensor("op_193"), val = tensor([1])]; tensor channels_mean_1_cast_fp16 = reduce_mean(axes = var_193, keep_dims = var_107, x = inputs_1_cast_fp16)[name = tensor("channels_mean_1_cast_fp16")]; tensor zero_mean_1_cast_fp16 = sub(x = inputs_1_cast_fp16, y = channels_mean_1_cast_fp16)[name = tensor("zero_mean_1_cast_fp16")]; tensor zero_mean_sq_1_cast_fp16 = mul(x = zero_mean_1_cast_fp16, y = zero_mean_1_cast_fp16)[name = tensor("zero_mean_sq_1_cast_fp16")]; tensor var_197 = const()[name = tensor("op_197"), val = tensor([1])]; tensor var_198_cast_fp16 = reduce_mean(axes = var_197, keep_dims = var_107, x = zero_mean_sq_1_cast_fp16)[name = tensor("op_198_cast_fp16")]; tensor var_199_to_fp16 = const()[name = tensor("op_199_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_200_cast_fp16 = add(x = var_198_cast_fp16, y = var_199_to_fp16)[name = tensor("op_200_cast_fp16")]; tensor denom_1_epsilon_0_to_fp16 = const()[name = tensor("denom_1_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_1_cast_fp16 = rsqrt(epsilon = denom_1_epsilon_0_to_fp16, x = var_200_cast_fp16)[name = tensor("denom_1_cast_fp16")]; tensor out_1_cast_fp16 = mul(x = zero_mean_1_cast_fp16, y = denom_1_cast_fp16)[name = tensor("out_1_cast_fp16")]; tensor var_204_to_fp16 = const()[name = tensor("op_204_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8844736)))]; tensor var_205_cast_fp16 = add(x = out_1_cast_fp16, y = var_204_to_fp16)[name = tensor("op_205_cast_fp16")]; tensor var_207_to_fp16 = const()[name = tensor("op_207_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8845440)))]; tensor hidden_states_9_cast_fp16 = mul(x = var_205_cast_fp16, y = var_207_to_fp16)[name = tensor("hidden_states_9_cast_fp16")]; tensor var_214 = const()[name = tensor("op_214"), val = tensor([1, 1])]; tensor var_216 = const()[name = tensor("op_216"), val = tensor([1, 1])]; tensor q_1_pad_type_0 = const()[name = tensor("q_1_pad_type_0"), val = tensor("custom")]; tensor q_1_pad_0 = const()[name = tensor("q_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8846144)))]; tensor q_1_cast_fp16 = conv(dilations = var_216, groups = var_112, pad = q_1_pad_0, pad_type = q_1_pad_type_0, strides = var_214, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_9_cast_fp16)[name = tensor("q_1_cast_fp16")]; tensor var_220 = const()[name = tensor("op_220"), val = tensor([1, 1])]; tensor var_222 = const()[name = tensor("op_222"), val = tensor([1, 1])]; tensor k_1_pad_type_0 = const()[name = tensor("k_1_pad_type_0"), val = tensor("custom")]; tensor k_1_pad_0 = const()[name = tensor("k_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9051008)))]; tensor k_1_cast_fp16 = conv(dilations = var_222, groups = var_112, pad = k_1_pad_0, pad_type = k_1_pad_type_0, strides = var_220, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_9_cast_fp16)[name = tensor("k_1_cast_fp16")]; tensor var_226 = const()[name = tensor("op_226"), val = tensor([1, 1])]; tensor var_228 = const()[name = tensor("op_228"), val = tensor([1, 1])]; tensor v_1_pad_type_0 = const()[name = tensor("v_1_pad_type_0"), val = tensor("custom")]; tensor v_1_pad_0 = const()[name = tensor("v_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9255872)))]; tensor v_1_cast_fp16 = conv(dilations = var_228, groups = var_112, pad = v_1_pad_0, pad_type = v_1_pad_type_0, strides = var_226, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_9_cast_fp16)[name = tensor("v_1_cast_fp16")]; tensor var_232_begin_0 = const()[name = tensor("op_232_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_232_end_0 = const()[name = tensor("op_232_end_0"), val = tensor([2, 64, 1, 2304])]; tensor var_232_end_mask_0 = const()[name = tensor("op_232_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_232_cast_fp16 = slice_by_index(begin = var_232_begin_0, end = var_232_end_0, end_mask = var_232_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_232_cast_fp16")]; tensor var_236_begin_0 = const()[name = tensor("op_236_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_236_end_0 = const()[name = tensor("op_236_end_0"), val = tensor([2, 128, 1, 2304])]; tensor var_236_end_mask_0 = const()[name = tensor("op_236_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_236_cast_fp16 = slice_by_index(begin = var_236_begin_0, end = var_236_end_0, end_mask = var_236_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_236_cast_fp16")]; tensor var_240_begin_0 = const()[name = tensor("op_240_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_240_end_0 = const()[name = tensor("op_240_end_0"), val = tensor([2, 192, 1, 2304])]; tensor var_240_end_mask_0 = const()[name = tensor("op_240_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_240_cast_fp16 = slice_by_index(begin = var_240_begin_0, end = var_240_end_0, end_mask = var_240_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_240_cast_fp16")]; tensor var_244_begin_0 = const()[name = tensor("op_244_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_244_end_0 = const()[name = tensor("op_244_end_0"), val = tensor([2, 256, 1, 2304])]; tensor var_244_end_mask_0 = const()[name = tensor("op_244_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_244_cast_fp16 = slice_by_index(begin = var_244_begin_0, end = var_244_end_0, end_mask = var_244_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_244_cast_fp16")]; tensor var_248_begin_0 = const()[name = tensor("op_248_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_248_end_0 = const()[name = tensor("op_248_end_0"), val = tensor([2, 320, 1, 2304])]; tensor var_248_end_mask_0 = const()[name = tensor("op_248_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_248_cast_fp16 = slice_by_index(begin = var_248_begin_0, end = var_248_end_0, end_mask = var_248_end_mask_0, x = q_1_cast_fp16)[name = tensor("op_248_cast_fp16")]; tensor k_3_perm_0 = const()[name = tensor("k_3_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_255_begin_0 = const()[name = tensor("op_255_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_255_end_0 = const()[name = tensor("op_255_end_0"), val = tensor([2, 2304, 1, 64])]; tensor var_255_end_mask_0 = const()[name = tensor("op_255_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_13 = transpose(perm = k_3_perm_0, x = k_1_cast_fp16)[name = tensor("transpose_13")]; tensor var_255_cast_fp16 = slice_by_index(begin = var_255_begin_0, end = var_255_end_0, end_mask = var_255_end_mask_0, x = transpose_13)[name = tensor("op_255_cast_fp16")]; tensor var_259_begin_0 = const()[name = tensor("op_259_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_259_end_0 = const()[name = tensor("op_259_end_0"), val = tensor([2, 2304, 1, 128])]; tensor var_259_end_mask_0 = const()[name = tensor("op_259_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_259_cast_fp16 = slice_by_index(begin = var_259_begin_0, end = var_259_end_0, end_mask = var_259_end_mask_0, x = transpose_13)[name = tensor("op_259_cast_fp16")]; tensor var_263_begin_0 = const()[name = tensor("op_263_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_263_end_0 = const()[name = tensor("op_263_end_0"), val = tensor([2, 2304, 1, 192])]; tensor var_263_end_mask_0 = const()[name = tensor("op_263_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_263_cast_fp16 = slice_by_index(begin = var_263_begin_0, end = var_263_end_0, end_mask = var_263_end_mask_0, x = transpose_13)[name = tensor("op_263_cast_fp16")]; tensor var_267_begin_0 = const()[name = tensor("op_267_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_267_end_0 = const()[name = tensor("op_267_end_0"), val = tensor([2, 2304, 1, 256])]; tensor var_267_end_mask_0 = const()[name = tensor("op_267_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_267_cast_fp16 = slice_by_index(begin = var_267_begin_0, end = var_267_end_0, end_mask = var_267_end_mask_0, x = transpose_13)[name = tensor("op_267_cast_fp16")]; tensor var_271_begin_0 = const()[name = tensor("op_271_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_271_end_0 = const()[name = tensor("op_271_end_0"), val = tensor([2, 2304, 1, 320])]; tensor var_271_end_mask_0 = const()[name = tensor("op_271_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_271_cast_fp16 = slice_by_index(begin = var_271_begin_0, end = var_271_end_0, end_mask = var_271_end_mask_0, x = transpose_13)[name = tensor("op_271_cast_fp16")]; tensor var_273_begin_0 = const()[name = tensor("op_273_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_273_end_0 = const()[name = tensor("op_273_end_0"), val = tensor([2, 64, 1, 2304])]; tensor var_273_end_mask_0 = const()[name = tensor("op_273_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_273_cast_fp16 = slice_by_index(begin = var_273_begin_0, end = var_273_end_0, end_mask = var_273_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_273_cast_fp16")]; tensor var_277_begin_0 = const()[name = tensor("op_277_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_277_end_0 = const()[name = tensor("op_277_end_0"), val = tensor([2, 128, 1, 2304])]; tensor var_277_end_mask_0 = const()[name = tensor("op_277_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_277_cast_fp16 = slice_by_index(begin = var_277_begin_0, end = var_277_end_0, end_mask = var_277_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_277_cast_fp16")]; tensor var_281_begin_0 = const()[name = tensor("op_281_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_281_end_0 = const()[name = tensor("op_281_end_0"), val = tensor([2, 192, 1, 2304])]; tensor var_281_end_mask_0 = const()[name = tensor("op_281_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_281_cast_fp16 = slice_by_index(begin = var_281_begin_0, end = var_281_end_0, end_mask = var_281_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_281_cast_fp16")]; tensor var_285_begin_0 = const()[name = tensor("op_285_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_285_end_0 = const()[name = tensor("op_285_end_0"), val = tensor([2, 256, 1, 2304])]; tensor var_285_end_mask_0 = const()[name = tensor("op_285_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_285_cast_fp16 = slice_by_index(begin = var_285_begin_0, end = var_285_end_0, end_mask = var_285_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_285_cast_fp16")]; tensor var_289_begin_0 = const()[name = tensor("op_289_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_289_end_0 = const()[name = tensor("op_289_end_0"), val = tensor([2, 320, 1, 2304])]; tensor var_289_end_mask_0 = const()[name = tensor("op_289_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_289_cast_fp16 = slice_by_index(begin = var_289_begin_0, end = var_289_end_0, end_mask = var_289_end_mask_0, x = v_1_cast_fp16)[name = tensor("op_289_cast_fp16")]; tensor var_293_equation_0 = const()[name = tensor("op_293_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_293_cast_fp16 = einsum(equation = var_293_equation_0, values = (var_255_cast_fp16, var_232_cast_fp16))[name = tensor("op_293_cast_fp16")]; tensor var_294_to_fp16 = const()[name = tensor("op_294_to_fp16"), val = tensor(0x1p-3)]; tensor aw_1_cast_fp16 = mul(x = var_293_cast_fp16, y = var_294_to_fp16)[name = tensor("aw_1_cast_fp16")]; tensor var_297_equation_0 = const()[name = tensor("op_297_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_297_cast_fp16 = einsum(equation = var_297_equation_0, values = (var_259_cast_fp16, var_236_cast_fp16))[name = tensor("op_297_cast_fp16")]; tensor var_298_to_fp16 = const()[name = tensor("op_298_to_fp16"), val = tensor(0x1p-3)]; tensor aw_3_cast_fp16 = mul(x = var_297_cast_fp16, y = var_298_to_fp16)[name = tensor("aw_3_cast_fp16")]; tensor var_301_equation_0 = const()[name = tensor("op_301_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_301_cast_fp16 = einsum(equation = var_301_equation_0, values = (var_263_cast_fp16, var_240_cast_fp16))[name = tensor("op_301_cast_fp16")]; tensor var_302_to_fp16 = const()[name = tensor("op_302_to_fp16"), val = tensor(0x1p-3)]; tensor aw_5_cast_fp16 = mul(x = var_301_cast_fp16, y = var_302_to_fp16)[name = tensor("aw_5_cast_fp16")]; tensor var_305_equation_0 = const()[name = tensor("op_305_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_305_cast_fp16 = einsum(equation = var_305_equation_0, values = (var_267_cast_fp16, var_244_cast_fp16))[name = tensor("op_305_cast_fp16")]; tensor var_306_to_fp16 = const()[name = tensor("op_306_to_fp16"), val = tensor(0x1p-3)]; tensor aw_7_cast_fp16 = mul(x = var_305_cast_fp16, y = var_306_to_fp16)[name = tensor("aw_7_cast_fp16")]; tensor var_309_equation_0 = const()[name = tensor("op_309_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_309_cast_fp16 = einsum(equation = var_309_equation_0, values = (var_271_cast_fp16, var_248_cast_fp16))[name = tensor("op_309_cast_fp16")]; tensor var_310_to_fp16 = const()[name = tensor("op_310_to_fp16"), val = tensor(0x1p-3)]; tensor aw_9_cast_fp16 = mul(x = var_309_cast_fp16, y = var_310_to_fp16)[name = tensor("aw_9_cast_fp16")]; tensor var_312_cast_fp16 = softmax(axis = var_112, x = aw_1_cast_fp16)[name = tensor("op_312_cast_fp16")]; tensor var_313_cast_fp16 = softmax(axis = var_112, x = aw_3_cast_fp16)[name = tensor("op_313_cast_fp16")]; tensor var_314_cast_fp16 = softmax(axis = var_112, x = aw_5_cast_fp16)[name = tensor("op_314_cast_fp16")]; tensor var_315_cast_fp16 = softmax(axis = var_112, x = aw_7_cast_fp16)[name = tensor("op_315_cast_fp16")]; tensor var_316_cast_fp16 = softmax(axis = var_112, x = aw_9_cast_fp16)[name = tensor("op_316_cast_fp16")]; tensor var_318_equation_0 = const()[name = tensor("op_318_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_318_cast_fp16 = einsum(equation = var_318_equation_0, values = (var_273_cast_fp16, var_312_cast_fp16))[name = tensor("op_318_cast_fp16")]; tensor var_320_equation_0 = const()[name = tensor("op_320_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_320_cast_fp16 = einsum(equation = var_320_equation_0, values = (var_277_cast_fp16, var_313_cast_fp16))[name = tensor("op_320_cast_fp16")]; tensor var_322_equation_0 = const()[name = tensor("op_322_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_322_cast_fp16 = einsum(equation = var_322_equation_0, values = (var_281_cast_fp16, var_314_cast_fp16))[name = tensor("op_322_cast_fp16")]; tensor var_324_equation_0 = const()[name = tensor("op_324_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_324_cast_fp16 = einsum(equation = var_324_equation_0, values = (var_285_cast_fp16, var_315_cast_fp16))[name = tensor("op_324_cast_fp16")]; tensor var_326_equation_0 = const()[name = tensor("op_326_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_326_cast_fp16 = einsum(equation = var_326_equation_0, values = (var_289_cast_fp16, var_316_cast_fp16))[name = tensor("op_326_cast_fp16")]; tensor input_25_interleave_0 = const()[name = tensor("input_25_interleave_0"), val = tensor(false)]; tensor input_25_cast_fp16 = concat(axis = var_112, interleave = input_25_interleave_0, values = (var_318_cast_fp16, var_320_cast_fp16, var_322_cast_fp16, var_324_cast_fp16, var_326_cast_fp16))[name = tensor("input_25_cast_fp16")]; tensor var_332 = const()[name = tensor("op_332"), val = tensor([1, 1])]; tensor var_334 = const()[name = tensor("op_334"), val = tensor([1, 1])]; tensor var_336_pad_type_0 = const()[name = tensor("op_336_pad_type_0"), val = tensor("custom")]; tensor var_336_pad_0 = const()[name = tensor("op_336_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9460736)))]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9665600)))]; tensor var_336_cast_fp16 = conv(bias = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_334, groups = var_112, pad = var_336_pad_0, pad_type = var_336_pad_type_0, strides = var_332, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_25_cast_fp16)[name = tensor("op_336_cast_fp16")]; tensor inputs_3_cast_fp16 = add(x = var_336_cast_fp16, y = inputs_1_cast_fp16)[name = tensor("inputs_3_cast_fp16")]; tensor var_340 = const()[name = tensor("op_340"), val = tensor([1])]; tensor channels_mean_3_cast_fp16 = reduce_mean(axes = var_340, keep_dims = var_107, x = inputs_3_cast_fp16)[name = tensor("channels_mean_3_cast_fp16")]; tensor zero_mean_3_cast_fp16 = sub(x = inputs_3_cast_fp16, y = channels_mean_3_cast_fp16)[name = tensor("zero_mean_3_cast_fp16")]; tensor zero_mean_sq_3_cast_fp16 = mul(x = zero_mean_3_cast_fp16, y = zero_mean_3_cast_fp16)[name = tensor("zero_mean_sq_3_cast_fp16")]; tensor var_344 = const()[name = tensor("op_344"), val = tensor([1])]; tensor var_345_cast_fp16 = reduce_mean(axes = var_344, keep_dims = var_107, x = zero_mean_sq_3_cast_fp16)[name = tensor("op_345_cast_fp16")]; tensor var_346_to_fp16 = const()[name = tensor("op_346_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_347_cast_fp16 = add(x = var_345_cast_fp16, y = var_346_to_fp16)[name = tensor("op_347_cast_fp16")]; tensor denom_3_epsilon_0_to_fp16 = const()[name = tensor("denom_3_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_3_cast_fp16 = rsqrt(epsilon = denom_3_epsilon_0_to_fp16, x = var_347_cast_fp16)[name = tensor("denom_3_cast_fp16")]; tensor out_3_cast_fp16 = mul(x = zero_mean_3_cast_fp16, y = denom_3_cast_fp16)[name = tensor("out_3_cast_fp16")]; tensor var_351_to_fp16 = const()[name = tensor("op_351_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9666304)))]; tensor var_352_cast_fp16 = add(x = out_3_cast_fp16, y = var_351_to_fp16)[name = tensor("op_352_cast_fp16")]; tensor var_354_to_fp16 = const()[name = tensor("op_354_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9667008)))]; tensor hidden_states_11_cast_fp16 = mul(x = var_352_cast_fp16, y = var_354_to_fp16)[name = tensor("hidden_states_11_cast_fp16")]; tensor var_361 = const()[name = tensor("op_361"), val = tensor([1, 1])]; tensor var_363 = const()[name = tensor("op_363"), val = tensor([1, 1])]; tensor q_3_pad_type_0 = const()[name = tensor("q_3_pad_type_0"), val = tensor("custom")]; tensor q_3_pad_0 = const()[name = tensor("q_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9667712)))]; tensor q_3_cast_fp16 = conv(dilations = var_363, groups = var_112, pad = q_3_pad_0, pad_type = q_3_pad_type_0, strides = var_361, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_11_cast_fp16)[name = tensor("q_3_cast_fp16")]; tensor var_367 = const()[name = tensor("op_367"), val = tensor([1, 1])]; tensor var_369 = const()[name = tensor("op_369"), val = tensor([1, 1])]; tensor k_5_pad_type_0 = const()[name = tensor("k_5_pad_type_0"), val = tensor("custom")]; tensor k_5_pad_0 = const()[name = tensor("k_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9872576)))]; tensor k_5_cast_fp16 = conv(dilations = var_369, groups = var_112, pad = k_5_pad_0, pad_type = k_5_pad_type_0, strides = var_367, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_5_cast_fp16")]; tensor var_373 = const()[name = tensor("op_373"), val = tensor([1, 1])]; tensor var_375 = const()[name = tensor("op_375"), val = tensor([1, 1])]; tensor v_3_pad_type_0 = const()[name = tensor("v_3_pad_type_0"), val = tensor("custom")]; tensor v_3_pad_0 = const()[name = tensor("v_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10528000)))]; tensor v_3_cast_fp16 = conv(dilations = var_375, groups = var_112, pad = v_3_pad_0, pad_type = v_3_pad_type_0, strides = var_373, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_3_cast_fp16")]; tensor var_379_begin_0 = const()[name = tensor("op_379_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_379_end_0 = const()[name = tensor("op_379_end_0"), val = tensor([2, 64, 1, 2304])]; tensor var_379_end_mask_0 = const()[name = tensor("op_379_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_379_cast_fp16 = slice_by_index(begin = var_379_begin_0, end = var_379_end_0, end_mask = var_379_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_379_cast_fp16")]; tensor var_383_begin_0 = const()[name = tensor("op_383_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_383_end_0 = const()[name = tensor("op_383_end_0"), val = tensor([2, 128, 1, 2304])]; tensor var_383_end_mask_0 = const()[name = tensor("op_383_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_383_cast_fp16 = slice_by_index(begin = var_383_begin_0, end = var_383_end_0, end_mask = var_383_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_383_cast_fp16")]; tensor var_387_begin_0 = const()[name = tensor("op_387_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_387_end_0 = const()[name = tensor("op_387_end_0"), val = tensor([2, 192, 1, 2304])]; tensor var_387_end_mask_0 = const()[name = tensor("op_387_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_387_cast_fp16 = slice_by_index(begin = var_387_begin_0, end = var_387_end_0, end_mask = var_387_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_387_cast_fp16")]; tensor var_391_begin_0 = const()[name = tensor("op_391_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_391_end_0 = const()[name = tensor("op_391_end_0"), val = tensor([2, 256, 1, 2304])]; tensor var_391_end_mask_0 = const()[name = tensor("op_391_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_391_cast_fp16 = slice_by_index(begin = var_391_begin_0, end = var_391_end_0, end_mask = var_391_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_391_cast_fp16")]; tensor var_395_begin_0 = const()[name = tensor("op_395_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_395_end_0 = const()[name = tensor("op_395_end_0"), val = tensor([2, 320, 1, 2304])]; tensor var_395_end_mask_0 = const()[name = tensor("op_395_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_395_cast_fp16 = slice_by_index(begin = var_395_begin_0, end = var_395_end_0, end_mask = var_395_end_mask_0, x = q_3_cast_fp16)[name = tensor("op_395_cast_fp16")]; tensor k_7_perm_0 = const()[name = tensor("k_7_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_402_begin_0 = const()[name = tensor("op_402_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_402_end_0 = const()[name = tensor("op_402_end_0"), val = tensor([2, 77, 1, 64])]; tensor var_402_end_mask_0 = const()[name = tensor("op_402_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_12 = transpose(perm = k_7_perm_0, x = k_5_cast_fp16)[name = tensor("transpose_12")]; tensor var_402_cast_fp16 = slice_by_index(begin = var_402_begin_0, end = var_402_end_0, end_mask = var_402_end_mask_0, x = transpose_12)[name = tensor("op_402_cast_fp16")]; tensor var_406_begin_0 = const()[name = tensor("op_406_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_406_end_0 = const()[name = tensor("op_406_end_0"), val = tensor([2, 77, 1, 128])]; tensor var_406_end_mask_0 = const()[name = tensor("op_406_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_406_cast_fp16 = slice_by_index(begin = var_406_begin_0, end = var_406_end_0, end_mask = var_406_end_mask_0, x = transpose_12)[name = tensor("op_406_cast_fp16")]; tensor var_410_begin_0 = const()[name = tensor("op_410_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_410_end_0 = const()[name = tensor("op_410_end_0"), val = tensor([2, 77, 1, 192])]; tensor var_410_end_mask_0 = const()[name = tensor("op_410_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_410_cast_fp16 = slice_by_index(begin = var_410_begin_0, end = var_410_end_0, end_mask = var_410_end_mask_0, x = transpose_12)[name = tensor("op_410_cast_fp16")]; tensor var_414_begin_0 = const()[name = tensor("op_414_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_414_end_0 = const()[name = tensor("op_414_end_0"), val = tensor([2, 77, 1, 256])]; tensor var_414_end_mask_0 = const()[name = tensor("op_414_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_414_cast_fp16 = slice_by_index(begin = var_414_begin_0, end = var_414_end_0, end_mask = var_414_end_mask_0, x = transpose_12)[name = tensor("op_414_cast_fp16")]; tensor var_418_begin_0 = const()[name = tensor("op_418_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_418_end_0 = const()[name = tensor("op_418_end_0"), val = tensor([2, 77, 1, 320])]; tensor var_418_end_mask_0 = const()[name = tensor("op_418_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_418_cast_fp16 = slice_by_index(begin = var_418_begin_0, end = var_418_end_0, end_mask = var_418_end_mask_0, x = transpose_12)[name = tensor("op_418_cast_fp16")]; tensor var_420_begin_0 = const()[name = tensor("op_420_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_420_end_0 = const()[name = tensor("op_420_end_0"), val = tensor([2, 64, 1, 77])]; tensor var_420_end_mask_0 = const()[name = tensor("op_420_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_420_cast_fp16 = slice_by_index(begin = var_420_begin_0, end = var_420_end_0, end_mask = var_420_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_420_cast_fp16")]; tensor var_424_begin_0 = const()[name = tensor("op_424_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_424_end_0 = const()[name = tensor("op_424_end_0"), val = tensor([2, 128, 1, 77])]; tensor var_424_end_mask_0 = const()[name = tensor("op_424_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_424_cast_fp16 = slice_by_index(begin = var_424_begin_0, end = var_424_end_0, end_mask = var_424_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_424_cast_fp16")]; tensor var_428_begin_0 = const()[name = tensor("op_428_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_428_end_0 = const()[name = tensor("op_428_end_0"), val = tensor([2, 192, 1, 77])]; tensor var_428_end_mask_0 = const()[name = tensor("op_428_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_428_cast_fp16 = slice_by_index(begin = var_428_begin_0, end = var_428_end_0, end_mask = var_428_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_428_cast_fp16")]; tensor var_432_begin_0 = const()[name = tensor("op_432_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_432_end_0 = const()[name = tensor("op_432_end_0"), val = tensor([2, 256, 1, 77])]; tensor var_432_end_mask_0 = const()[name = tensor("op_432_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_432_cast_fp16 = slice_by_index(begin = var_432_begin_0, end = var_432_end_0, end_mask = var_432_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_432_cast_fp16")]; tensor var_436_begin_0 = const()[name = tensor("op_436_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_436_end_0 = const()[name = tensor("op_436_end_0"), val = tensor([2, 320, 1, 77])]; tensor var_436_end_mask_0 = const()[name = tensor("op_436_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_436_cast_fp16 = slice_by_index(begin = var_436_begin_0, end = var_436_end_0, end_mask = var_436_end_mask_0, x = v_3_cast_fp16)[name = tensor("op_436_cast_fp16")]; tensor var_440_equation_0 = const()[name = tensor("op_440_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_440_cast_fp16 = einsum(equation = var_440_equation_0, values = (var_402_cast_fp16, var_379_cast_fp16))[name = tensor("op_440_cast_fp16")]; tensor var_441_to_fp16 = const()[name = tensor("op_441_to_fp16"), val = tensor(0x1p-3)]; tensor aw_11_cast_fp16 = mul(x = var_440_cast_fp16, y = var_441_to_fp16)[name = tensor("aw_11_cast_fp16")]; tensor var_444_equation_0 = const()[name = tensor("op_444_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_444_cast_fp16 = einsum(equation = var_444_equation_0, values = (var_406_cast_fp16, var_383_cast_fp16))[name = tensor("op_444_cast_fp16")]; tensor var_445_to_fp16 = const()[name = tensor("op_445_to_fp16"), val = tensor(0x1p-3)]; tensor aw_13_cast_fp16 = mul(x = var_444_cast_fp16, y = var_445_to_fp16)[name = tensor("aw_13_cast_fp16")]; tensor var_448_equation_0 = const()[name = tensor("op_448_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_448_cast_fp16 = einsum(equation = var_448_equation_0, values = (var_410_cast_fp16, var_387_cast_fp16))[name = tensor("op_448_cast_fp16")]; tensor var_449_to_fp16 = const()[name = tensor("op_449_to_fp16"), val = tensor(0x1p-3)]; tensor aw_15_cast_fp16 = mul(x = var_448_cast_fp16, y = var_449_to_fp16)[name = tensor("aw_15_cast_fp16")]; tensor var_452_equation_0 = const()[name = tensor("op_452_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_452_cast_fp16 = einsum(equation = var_452_equation_0, values = (var_414_cast_fp16, var_391_cast_fp16))[name = tensor("op_452_cast_fp16")]; tensor var_453_to_fp16 = const()[name = tensor("op_453_to_fp16"), val = tensor(0x1p-3)]; tensor aw_17_cast_fp16 = mul(x = var_452_cast_fp16, y = var_453_to_fp16)[name = tensor("aw_17_cast_fp16")]; tensor var_456_equation_0 = const()[name = tensor("op_456_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_456_cast_fp16 = einsum(equation = var_456_equation_0, values = (var_418_cast_fp16, var_395_cast_fp16))[name = tensor("op_456_cast_fp16")]; tensor var_457_to_fp16 = const()[name = tensor("op_457_to_fp16"), val = tensor(0x1p-3)]; tensor aw_19_cast_fp16 = mul(x = var_456_cast_fp16, y = var_457_to_fp16)[name = tensor("aw_19_cast_fp16")]; tensor var_459_cast_fp16 = softmax(axis = var_112, x = aw_11_cast_fp16)[name = tensor("op_459_cast_fp16")]; tensor var_460_cast_fp16 = softmax(axis = var_112, x = aw_13_cast_fp16)[name = tensor("op_460_cast_fp16")]; tensor var_461_cast_fp16 = softmax(axis = var_112, x = aw_15_cast_fp16)[name = tensor("op_461_cast_fp16")]; tensor var_462_cast_fp16 = softmax(axis = var_112, x = aw_17_cast_fp16)[name = tensor("op_462_cast_fp16")]; tensor var_463_cast_fp16 = softmax(axis = var_112, x = aw_19_cast_fp16)[name = tensor("op_463_cast_fp16")]; tensor var_465_equation_0 = const()[name = tensor("op_465_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_465_cast_fp16 = einsum(equation = var_465_equation_0, values = (var_420_cast_fp16, var_459_cast_fp16))[name = tensor("op_465_cast_fp16")]; tensor var_467_equation_0 = const()[name = tensor("op_467_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_467_cast_fp16 = einsum(equation = var_467_equation_0, values = (var_424_cast_fp16, var_460_cast_fp16))[name = tensor("op_467_cast_fp16")]; tensor var_469_equation_0 = const()[name = tensor("op_469_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_469_cast_fp16 = einsum(equation = var_469_equation_0, values = (var_428_cast_fp16, var_461_cast_fp16))[name = tensor("op_469_cast_fp16")]; tensor var_471_equation_0 = const()[name = tensor("op_471_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_471_cast_fp16 = einsum(equation = var_471_equation_0, values = (var_432_cast_fp16, var_462_cast_fp16))[name = tensor("op_471_cast_fp16")]; tensor var_473_equation_0 = const()[name = tensor("op_473_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_473_cast_fp16 = einsum(equation = var_473_equation_0, values = (var_436_cast_fp16, var_463_cast_fp16))[name = tensor("op_473_cast_fp16")]; tensor input_27_interleave_0 = const()[name = tensor("input_27_interleave_0"), val = tensor(false)]; tensor input_27_cast_fp16 = concat(axis = var_112, interleave = input_27_interleave_0, values = (var_465_cast_fp16, var_467_cast_fp16, var_469_cast_fp16, var_471_cast_fp16, var_473_cast_fp16))[name = tensor("input_27_cast_fp16")]; tensor var_479 = const()[name = tensor("op_479"), val = tensor([1, 1])]; tensor var_481 = const()[name = tensor("op_481"), val = tensor([1, 1])]; tensor var_483_pad_type_0 = const()[name = tensor("op_483_pad_type_0"), val = tensor("custom")]; tensor var_483_pad_0 = const()[name = tensor("op_483_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11183424)))]; tensor down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11388288)))]; tensor var_483_cast_fp16 = conv(bias = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_481, groups = var_112, pad = var_483_pad_0, pad_type = var_483_pad_type_0, strides = var_479, weight = down_blocks_0_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_27_cast_fp16)[name = tensor("op_483_cast_fp16")]; tensor inputs_5_cast_fp16 = add(x = var_483_cast_fp16, y = inputs_3_cast_fp16)[name = tensor("inputs_5_cast_fp16")]; tensor var_487 = const()[name = tensor("op_487"), val = tensor([1])]; tensor channels_mean_5_cast_fp16 = reduce_mean(axes = var_487, keep_dims = var_107, x = inputs_5_cast_fp16)[name = tensor("channels_mean_5_cast_fp16")]; tensor zero_mean_5_cast_fp16 = sub(x = inputs_5_cast_fp16, y = channels_mean_5_cast_fp16)[name = tensor("zero_mean_5_cast_fp16")]; tensor zero_mean_sq_5_cast_fp16 = mul(x = zero_mean_5_cast_fp16, y = zero_mean_5_cast_fp16)[name = tensor("zero_mean_sq_5_cast_fp16")]; tensor var_491 = const()[name = tensor("op_491"), val = tensor([1])]; tensor var_492_cast_fp16 = reduce_mean(axes = var_491, keep_dims = var_107, x = zero_mean_sq_5_cast_fp16)[name = tensor("op_492_cast_fp16")]; tensor var_493_to_fp16 = const()[name = tensor("op_493_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_494_cast_fp16 = add(x = var_492_cast_fp16, y = var_493_to_fp16)[name = tensor("op_494_cast_fp16")]; tensor denom_5_epsilon_0_to_fp16 = const()[name = tensor("denom_5_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_5_cast_fp16 = rsqrt(epsilon = denom_5_epsilon_0_to_fp16, x = var_494_cast_fp16)[name = tensor("denom_5_cast_fp16")]; tensor out_5_cast_fp16 = mul(x = zero_mean_5_cast_fp16, y = denom_5_cast_fp16)[name = tensor("out_5_cast_fp16")]; tensor var_498_to_fp16 = const()[name = tensor("op_498_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11388992)))]; tensor var_499_cast_fp16 = add(x = out_5_cast_fp16, y = var_498_to_fp16)[name = tensor("op_499_cast_fp16")]; tensor var_501_to_fp16 = const()[name = tensor("op_501_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11389696)))]; tensor input_29_cast_fp16 = mul(x = var_499_cast_fp16, y = var_501_to_fp16)[name = tensor("input_29_cast_fp16")]; tensor var_509 = const()[name = tensor("op_509"), val = tensor([1, 1])]; tensor var_511 = const()[name = tensor("op_511"), val = tensor([1, 1])]; tensor var_513_pad_type_0 = const()[name = tensor("op_513_pad_type_0"), val = tensor("custom")]; tensor var_513_pad_0 = const()[name = tensor("op_513_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11390400)))]; tensor down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13028864)))]; tensor var_513_cast_fp16 = conv(bias = down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_511, groups = var_112, pad = var_513_pad_0, pad_type = var_513_pad_type_0, strides = var_509, weight = down_blocks_0_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_29_cast_fp16)[name = tensor("op_513_cast_fp16")]; tensor var_514_split_sizes_0 = const()[name = tensor("op_514_split_sizes_0"), val = tensor([1280, 1280])]; tensor var_514_axis_0 = const()[name = tensor("op_514_axis_0"), val = tensor(1)]; tensor var_514_cast_fp16_0, tensor var_514_cast_fp16_1 = split(axis = var_514_axis_0, split_sizes = var_514_split_sizes_0, x = var_513_cast_fp16)[name = tensor("op_514_cast_fp16")]; tensor var_516_mode_0 = const()[name = tensor("op_516_mode_0"), val = tensor("EXACT")]; tensor var_516_cast_fp16 = gelu(mode = var_516_mode_0, x = var_514_cast_fp16_1)[name = tensor("op_516_cast_fp16")]; tensor input_31_cast_fp16 = mul(x = var_514_cast_fp16_0, y = var_516_cast_fp16)[name = tensor("input_31_cast_fp16")]; tensor var_520 = const()[name = tensor("op_520"), val = tensor([1, 1])]; tensor var_522 = const()[name = tensor("op_522"), val = tensor([1, 1])]; tensor var_524_pad_type_0 = const()[name = tensor("op_524_pad_type_0"), val = tensor("custom")]; tensor var_524_pad_0 = const()[name = tensor("op_524_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13034048)))]; tensor down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13853312)))]; tensor var_524_cast_fp16 = conv(bias = down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_522, groups = var_112, pad = var_524_pad_0, pad_type = var_524_pad_type_0, strides = var_520, weight = down_blocks_0_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_31_cast_fp16)[name = tensor("op_524_cast_fp16")]; tensor hidden_states_15_cast_fp16 = add(x = var_524_cast_fp16, y = inputs_5_cast_fp16)[name = tensor("hidden_states_15_cast_fp16")]; tensor var_526 = const()[name = tensor("op_526"), val = tensor([2, 320, 48, 48])]; tensor input_33_cast_fp16 = reshape(shape = var_526, x = hidden_states_15_cast_fp16)[name = tensor("input_33_cast_fp16")]; tensor var_530 = const()[name = tensor("op_530"), val = tensor([1, 1])]; tensor var_532 = const()[name = tensor("op_532"), val = tensor([1, 1])]; tensor hidden_states_17_pad_type_0 = const()[name = tensor("hidden_states_17_pad_type_0"), val = tensor("custom")]; tensor hidden_states_17_pad_0 = const()[name = tensor("hidden_states_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13854016)))]; tensor down_blocks_0_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14058880)))]; tensor hidden_states_17_cast_fp16 = conv(bias = down_blocks_0_attentions_0_proj_out_bias_to_fp16, dilations = var_532, groups = var_112, pad = hidden_states_17_pad_0, pad_type = hidden_states_17_pad_type_0, strides = var_530, weight = down_blocks_0_attentions_0_proj_out_weight_to_fp16, x = input_33_cast_fp16)[name = tensor("hidden_states_17_cast_fp16")]; tensor input_35_cast_fp16_1 = add(x = hidden_states_17_cast_fp16, y = hidden_states_5_cast_fp16)[name = tensor("input_35_cast_fp16")]; tensor reshape_12_shape_0 = const()[name = tensor("reshape_12_shape_0"), val = tensor([2, 32, 10, 48, 48])]; tensor reshape_12_cast_fp16 = reshape(shape = reshape_12_shape_0, x = input_35_cast_fp16_1)[name = tensor("reshape_12_cast_fp16")]; tensor reduce_mean_9_axes_0 = const()[name = tensor("reduce_mean_9_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_9_keep_dims_0 = const()[name = tensor("reduce_mean_9_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_9_cast_fp16 = reduce_mean(axes = reduce_mean_9_axes_0, keep_dims = reduce_mean_9_keep_dims_0, x = reshape_12_cast_fp16)[name = tensor("reduce_mean_9_cast_fp16")]; tensor sub_6_cast_fp16 = sub(x = reshape_12_cast_fp16, y = reduce_mean_9_cast_fp16)[name = tensor("sub_6_cast_fp16")]; tensor square_3_cast_fp16 = square(x = sub_6_cast_fp16)[name = tensor("square_3_cast_fp16")]; tensor reduce_mean_11_axes_0 = const()[name = tensor("reduce_mean_11_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_11_keep_dims_0 = const()[name = tensor("reduce_mean_11_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_11_cast_fp16 = reduce_mean(axes = reduce_mean_11_axes_0, keep_dims = reduce_mean_11_keep_dims_0, x = square_3_cast_fp16)[name = tensor("reduce_mean_11_cast_fp16")]; tensor add_6_y_0_to_fp16 = const()[name = tensor("add_6_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_6_cast_fp16 = add(x = reduce_mean_11_cast_fp16, y = add_6_y_0_to_fp16)[name = tensor("add_6_cast_fp16")]; tensor sqrt_3_cast_fp16 = sqrt(x = add_6_cast_fp16)[name = tensor("sqrt_3_cast_fp16")]; tensor real_div_3_cast_fp16 = real_div(x = sub_6_cast_fp16, y = sqrt_3_cast_fp16)[name = tensor("real_div_3_cast_fp16")]; tensor reshape_13_shape_0 = const()[name = tensor("reshape_13_shape_0"), val = tensor([2, 320, 48, 48])]; tensor reshape_13_cast_fp16 = reshape(shape = reshape_13_shape_0, x = real_div_3_cast_fp16)[name = tensor("reshape_13_cast_fp16")]; tensor add_7_gamma_0_to_fp16 = const()[name = tensor("add_7_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14059584)))]; tensor add_7_beta_0_to_fp16 = const()[name = tensor("add_7_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14060288)))]; tensor add_7_epsilon_0_to_fp16 = const()[name = tensor("add_7_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_7_cast_fp16 = batch_norm(beta = add_7_beta_0_to_fp16, epsilon = add_7_epsilon_0_to_fp16, gamma = add_7_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_13_cast_fp16)[name = tensor("add_7_cast_fp16")]; tensor input_39_cast_fp16 = silu(x = add_7_cast_fp16)[name = tensor("input_39_cast_fp16")]; tensor var_547 = const()[name = tensor("op_547"), val = tensor([1, 1])]; tensor var_549 = const()[name = tensor("op_549"), val = tensor([1, 1])]; tensor hidden_states_19_pad_type_0 = const()[name = tensor("hidden_states_19_pad_type_0"), val = tensor("custom")]; tensor hidden_states_19_pad_0 = const()[name = tensor("hidden_states_19_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_0_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14060992)))]; tensor down_blocks_0_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15904256)))]; tensor hidden_states_19_cast_fp16 = conv(bias = down_blocks_0_resnets_1_conv1_bias_to_fp16, dilations = var_549, groups = var_112, pad = hidden_states_19_pad_0, pad_type = hidden_states_19_pad_type_0, strides = var_547, weight = down_blocks_0_resnets_1_conv1_weight_to_fp16, x = input_39_cast_fp16)[name = tensor("hidden_states_19_cast_fp16")]; tensor var_555 = const()[name = tensor("op_555"), val = tensor([1, 1])]; tensor var_557 = const()[name = tensor("op_557"), val = tensor([1, 1])]; tensor temb_3_pad_type_0 = const()[name = tensor("temb_3_pad_type_0"), val = tensor("custom")]; tensor temb_3_pad_0 = const()[name = tensor("temb_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15904960)))]; tensor down_blocks_0_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16724224)))]; tensor temb_3_cast_fp16 = conv(bias = down_blocks_0_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_557, groups = var_112, pad = temb_3_pad_0, pad_type = temb_3_pad_type_0, strides = var_555, weight = down_blocks_0_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_3_cast_fp16")]; tensor input_43_cast_fp16 = add(x = hidden_states_19_cast_fp16, y = temb_3_cast_fp16)[name = tensor("input_43_cast_fp16")]; tensor reshape_16_shape_0 = const()[name = tensor("reshape_16_shape_0"), val = tensor([2, 32, 10, 48, 48])]; tensor reshape_16_cast_fp16 = reshape(shape = reshape_16_shape_0, x = input_43_cast_fp16)[name = tensor("reshape_16_cast_fp16")]; tensor reduce_mean_12_axes_0 = const()[name = tensor("reduce_mean_12_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_12_keep_dims_0 = const()[name = tensor("reduce_mean_12_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_12_cast_fp16 = reduce_mean(axes = reduce_mean_12_axes_0, keep_dims = reduce_mean_12_keep_dims_0, x = reshape_16_cast_fp16)[name = tensor("reduce_mean_12_cast_fp16")]; tensor sub_8_cast_fp16 = sub(x = reshape_16_cast_fp16, y = reduce_mean_12_cast_fp16)[name = tensor("sub_8_cast_fp16")]; tensor square_4_cast_fp16 = square(x = sub_8_cast_fp16)[name = tensor("square_4_cast_fp16")]; tensor reduce_mean_14_axes_0 = const()[name = tensor("reduce_mean_14_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_14_keep_dims_0 = const()[name = tensor("reduce_mean_14_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_14_cast_fp16 = reduce_mean(axes = reduce_mean_14_axes_0, keep_dims = reduce_mean_14_keep_dims_0, x = square_4_cast_fp16)[name = tensor("reduce_mean_14_cast_fp16")]; tensor add_8_y_0_to_fp16 = const()[name = tensor("add_8_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_8_cast_fp16 = add(x = reduce_mean_14_cast_fp16, y = add_8_y_0_to_fp16)[name = tensor("add_8_cast_fp16")]; tensor sqrt_4_cast_fp16 = sqrt(x = add_8_cast_fp16)[name = tensor("sqrt_4_cast_fp16")]; tensor real_div_4_cast_fp16 = real_div(x = sub_8_cast_fp16, y = sqrt_4_cast_fp16)[name = tensor("real_div_4_cast_fp16")]; tensor reshape_17_shape_0 = const()[name = tensor("reshape_17_shape_0"), val = tensor([2, 320, 48, 48])]; tensor reshape_17_cast_fp16 = reshape(shape = reshape_17_shape_0, x = real_div_4_cast_fp16)[name = tensor("reshape_17_cast_fp16")]; tensor add_9_gamma_0_to_fp16 = const()[name = tensor("add_9_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16724928)))]; tensor add_9_beta_0_to_fp16 = const()[name = tensor("add_9_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16725632)))]; tensor add_9_epsilon_0_to_fp16 = const()[name = tensor("add_9_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_9_cast_fp16 = batch_norm(beta = add_9_beta_0_to_fp16, epsilon = add_9_epsilon_0_to_fp16, gamma = add_9_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_17_cast_fp16)[name = tensor("add_9_cast_fp16")]; tensor input_47_cast_fp16 = silu(x = add_9_cast_fp16)[name = tensor("input_47_cast_fp16")]; tensor var_567 = const()[name = tensor("op_567"), val = tensor([1, 1])]; tensor var_569 = const()[name = tensor("op_569"), val = tensor([1, 1])]; tensor hidden_states_21_pad_type_0 = const()[name = tensor("hidden_states_21_pad_type_0"), val = tensor("custom")]; tensor hidden_states_21_pad_0 = const()[name = tensor("hidden_states_21_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_0_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16726336)))]; tensor down_blocks_0_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_0_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18569600)))]; tensor hidden_states_21_cast_fp16 = conv(bias = down_blocks_0_resnets_1_conv2_bias_to_fp16, dilations = var_569, groups = var_112, pad = hidden_states_21_pad_0, pad_type = hidden_states_21_pad_type_0, strides = var_567, weight = down_blocks_0_resnets_1_conv2_weight_to_fp16, x = input_47_cast_fp16)[name = tensor("hidden_states_21_cast_fp16")]; tensor hidden_states_23_cast_fp16 = add(x = input_35_cast_fp16_1, y = hidden_states_21_cast_fp16)[name = tensor("hidden_states_23_cast_fp16")]; tensor reshape_20_shape_0 = const()[name = tensor("reshape_20_shape_0"), val = tensor([2, 32, 10, 48, 48])]; tensor reshape_20_cast_fp16 = reshape(shape = reshape_20_shape_0, x = hidden_states_23_cast_fp16)[name = tensor("reshape_20_cast_fp16")]; tensor reduce_mean_15_axes_0 = const()[name = tensor("reduce_mean_15_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_15_keep_dims_0 = const()[name = tensor("reduce_mean_15_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_15_cast_fp16 = reduce_mean(axes = reduce_mean_15_axes_0, keep_dims = reduce_mean_15_keep_dims_0, x = reshape_20_cast_fp16)[name = tensor("reduce_mean_15_cast_fp16")]; tensor sub_10_cast_fp16 = sub(x = reshape_20_cast_fp16, y = reduce_mean_15_cast_fp16)[name = tensor("sub_10_cast_fp16")]; tensor square_5_cast_fp16 = square(x = sub_10_cast_fp16)[name = tensor("square_5_cast_fp16")]; tensor reduce_mean_17_axes_0 = const()[name = tensor("reduce_mean_17_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_17_keep_dims_0 = const()[name = tensor("reduce_mean_17_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_17_cast_fp16 = reduce_mean(axes = reduce_mean_17_axes_0, keep_dims = reduce_mean_17_keep_dims_0, x = square_5_cast_fp16)[name = tensor("reduce_mean_17_cast_fp16")]; tensor add_10_y_0_to_fp16 = const()[name = tensor("add_10_y_0_to_fp16"), val = tensor(0x1.1p-20)]; tensor add_10_cast_fp16 = add(x = reduce_mean_17_cast_fp16, y = add_10_y_0_to_fp16)[name = tensor("add_10_cast_fp16")]; tensor sqrt_5_cast_fp16 = sqrt(x = add_10_cast_fp16)[name = tensor("sqrt_5_cast_fp16")]; tensor real_div_5_cast_fp16 = real_div(x = sub_10_cast_fp16, y = sqrt_5_cast_fp16)[name = tensor("real_div_5_cast_fp16")]; tensor reshape_21_shape_0 = const()[name = tensor("reshape_21_shape_0"), val = tensor([2, 320, 48, 48])]; tensor reshape_21_cast_fp16 = reshape(shape = reshape_21_shape_0, x = real_div_5_cast_fp16)[name = tensor("reshape_21_cast_fp16")]; tensor add_11_gamma_0_to_fp16 = const()[name = tensor("add_11_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18570304)))]; tensor add_11_beta_0_to_fp16 = const()[name = tensor("add_11_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18571008)))]; tensor add_11_epsilon_0_to_fp16 = const()[name = tensor("add_11_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_11_cast_fp16 = batch_norm(beta = add_11_beta_0_to_fp16, epsilon = add_11_epsilon_0_to_fp16, gamma = add_11_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_21_cast_fp16)[name = tensor("add_11_cast_fp16")]; tensor var_589 = const()[name = tensor("op_589"), val = tensor([1, 1])]; tensor var_591 = const()[name = tensor("op_591"), val = tensor([1, 1])]; tensor hidden_states_25_pad_type_0 = const()[name = tensor("hidden_states_25_pad_type_0"), val = tensor("custom")]; tensor hidden_states_25_pad_0 = const()[name = tensor("hidden_states_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18571712)))]; tensor down_blocks_0_attentions_1_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18776576)))]; tensor hidden_states_25_cast_fp16 = conv(bias = down_blocks_0_attentions_1_proj_in_bias_to_fp16, dilations = var_591, groups = var_112, pad = hidden_states_25_pad_0, pad_type = hidden_states_25_pad_type_0, strides = var_589, weight = down_blocks_0_attentions_1_proj_in_weight_to_fp16, x = add_11_cast_fp16)[name = tensor("hidden_states_25_cast_fp16")]; tensor var_596 = const()[name = tensor("op_596"), val = tensor([2, 320, 1, 2304])]; tensor inputs_7_cast_fp16 = reshape(shape = var_596, x = hidden_states_25_cast_fp16)[name = tensor("inputs_7_cast_fp16")]; tensor var_606 = const()[name = tensor("op_606"), val = tensor([1])]; tensor channels_mean_7_cast_fp16 = reduce_mean(axes = var_606, keep_dims = var_107, x = inputs_7_cast_fp16)[name = tensor("channels_mean_7_cast_fp16")]; tensor zero_mean_7_cast_fp16 = sub(x = inputs_7_cast_fp16, y = channels_mean_7_cast_fp16)[name = tensor("zero_mean_7_cast_fp16")]; tensor zero_mean_sq_7_cast_fp16 = mul(x = zero_mean_7_cast_fp16, y = zero_mean_7_cast_fp16)[name = tensor("zero_mean_sq_7_cast_fp16")]; tensor var_610 = const()[name = tensor("op_610"), val = tensor([1])]; tensor var_611_cast_fp16 = reduce_mean(axes = var_610, keep_dims = var_107, x = zero_mean_sq_7_cast_fp16)[name = tensor("op_611_cast_fp16")]; tensor var_612_to_fp16 = const()[name = tensor("op_612_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_613_cast_fp16 = add(x = var_611_cast_fp16, y = var_612_to_fp16)[name = tensor("op_613_cast_fp16")]; tensor denom_7_epsilon_0_to_fp16 = const()[name = tensor("denom_7_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_7_cast_fp16 = rsqrt(epsilon = denom_7_epsilon_0_to_fp16, x = var_613_cast_fp16)[name = tensor("denom_7_cast_fp16")]; tensor out_7_cast_fp16 = mul(x = zero_mean_7_cast_fp16, y = denom_7_cast_fp16)[name = tensor("out_7_cast_fp16")]; tensor var_617_to_fp16 = const()[name = tensor("op_617_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18777280)))]; tensor var_618_cast_fp16 = add(x = out_7_cast_fp16, y = var_617_to_fp16)[name = tensor("op_618_cast_fp16")]; tensor var_620_to_fp16 = const()[name = tensor("op_620_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18777984)))]; tensor hidden_states_27_cast_fp16 = mul(x = var_618_cast_fp16, y = var_620_to_fp16)[name = tensor("hidden_states_27_cast_fp16")]; tensor var_627 = const()[name = tensor("op_627"), val = tensor([1, 1])]; tensor var_629 = const()[name = tensor("op_629"), val = tensor([1, 1])]; tensor q_5_pad_type_0 = const()[name = tensor("q_5_pad_type_0"), val = tensor("custom")]; tensor q_5_pad_0 = const()[name = tensor("q_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18778688)))]; tensor q_5_cast_fp16 = conv(dilations = var_629, groups = var_112, pad = q_5_pad_0, pad_type = q_5_pad_type_0, strides = var_627, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor("q_5_cast_fp16")]; tensor var_633 = const()[name = tensor("op_633"), val = tensor([1, 1])]; tensor var_635 = const()[name = tensor("op_635"), val = tensor([1, 1])]; tensor k_9_pad_type_0 = const()[name = tensor("k_9_pad_type_0"), val = tensor("custom")]; tensor k_9_pad_0 = const()[name = tensor("k_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18983552)))]; tensor k_9_cast_fp16 = conv(dilations = var_635, groups = var_112, pad = k_9_pad_0, pad_type = k_9_pad_type_0, strides = var_633, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor("k_9_cast_fp16")]; tensor var_639 = const()[name = tensor("op_639"), val = tensor([1, 1])]; tensor var_641 = const()[name = tensor("op_641"), val = tensor([1, 1])]; tensor v_5_pad_type_0 = const()[name = tensor("v_5_pad_type_0"), val = tensor("custom")]; tensor v_5_pad_0 = const()[name = tensor("v_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19188416)))]; tensor v_5_cast_fp16 = conv(dilations = var_641, groups = var_112, pad = v_5_pad_0, pad_type = v_5_pad_type_0, strides = var_639, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_27_cast_fp16)[name = tensor("v_5_cast_fp16")]; tensor var_645_begin_0 = const()[name = tensor("op_645_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_645_end_0 = const()[name = tensor("op_645_end_0"), val = tensor([2, 64, 1, 2304])]; tensor var_645_end_mask_0 = const()[name = tensor("op_645_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_645_cast_fp16 = slice_by_index(begin = var_645_begin_0, end = var_645_end_0, end_mask = var_645_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_645_cast_fp16")]; tensor var_649_begin_0 = const()[name = tensor("op_649_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_649_end_0 = const()[name = tensor("op_649_end_0"), val = tensor([2, 128, 1, 2304])]; tensor var_649_end_mask_0 = const()[name = tensor("op_649_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_649_cast_fp16 = slice_by_index(begin = var_649_begin_0, end = var_649_end_0, end_mask = var_649_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_649_cast_fp16")]; tensor var_653_begin_0 = const()[name = tensor("op_653_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_653_end_0 = const()[name = tensor("op_653_end_0"), val = tensor([2, 192, 1, 2304])]; tensor var_653_end_mask_0 = const()[name = tensor("op_653_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_653_cast_fp16 = slice_by_index(begin = var_653_begin_0, end = var_653_end_0, end_mask = var_653_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_653_cast_fp16")]; tensor var_657_begin_0 = const()[name = tensor("op_657_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_657_end_0 = const()[name = tensor("op_657_end_0"), val = tensor([2, 256, 1, 2304])]; tensor var_657_end_mask_0 = const()[name = tensor("op_657_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_657_cast_fp16 = slice_by_index(begin = var_657_begin_0, end = var_657_end_0, end_mask = var_657_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_657_cast_fp16")]; tensor var_661_begin_0 = const()[name = tensor("op_661_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_661_end_0 = const()[name = tensor("op_661_end_0"), val = tensor([2, 320, 1, 2304])]; tensor var_661_end_mask_0 = const()[name = tensor("op_661_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_661_cast_fp16 = slice_by_index(begin = var_661_begin_0, end = var_661_end_0, end_mask = var_661_end_mask_0, x = q_5_cast_fp16)[name = tensor("op_661_cast_fp16")]; tensor k_11_perm_0 = const()[name = tensor("k_11_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_668_begin_0 = const()[name = tensor("op_668_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_668_end_0 = const()[name = tensor("op_668_end_0"), val = tensor([2, 2304, 1, 64])]; tensor var_668_end_mask_0 = const()[name = tensor("op_668_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_11 = transpose(perm = k_11_perm_0, x = k_9_cast_fp16)[name = tensor("transpose_11")]; tensor var_668_cast_fp16 = slice_by_index(begin = var_668_begin_0, end = var_668_end_0, end_mask = var_668_end_mask_0, x = transpose_11)[name = tensor("op_668_cast_fp16")]; tensor var_672_begin_0 = const()[name = tensor("op_672_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_672_end_0 = const()[name = tensor("op_672_end_0"), val = tensor([2, 2304, 1, 128])]; tensor var_672_end_mask_0 = const()[name = tensor("op_672_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_672_cast_fp16 = slice_by_index(begin = var_672_begin_0, end = var_672_end_0, end_mask = var_672_end_mask_0, x = transpose_11)[name = tensor("op_672_cast_fp16")]; tensor var_676_begin_0 = const()[name = tensor("op_676_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_676_end_0 = const()[name = tensor("op_676_end_0"), val = tensor([2, 2304, 1, 192])]; tensor var_676_end_mask_0 = const()[name = tensor("op_676_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_676_cast_fp16 = slice_by_index(begin = var_676_begin_0, end = var_676_end_0, end_mask = var_676_end_mask_0, x = transpose_11)[name = tensor("op_676_cast_fp16")]; tensor var_680_begin_0 = const()[name = tensor("op_680_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_680_end_0 = const()[name = tensor("op_680_end_0"), val = tensor([2, 2304, 1, 256])]; tensor var_680_end_mask_0 = const()[name = tensor("op_680_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_680_cast_fp16 = slice_by_index(begin = var_680_begin_0, end = var_680_end_0, end_mask = var_680_end_mask_0, x = transpose_11)[name = tensor("op_680_cast_fp16")]; tensor var_684_begin_0 = const()[name = tensor("op_684_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_684_end_0 = const()[name = tensor("op_684_end_0"), val = tensor([2, 2304, 1, 320])]; tensor var_684_end_mask_0 = const()[name = tensor("op_684_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_684_cast_fp16 = slice_by_index(begin = var_684_begin_0, end = var_684_end_0, end_mask = var_684_end_mask_0, x = transpose_11)[name = tensor("op_684_cast_fp16")]; tensor var_686_begin_0 = const()[name = tensor("op_686_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_686_end_0 = const()[name = tensor("op_686_end_0"), val = tensor([2, 64, 1, 2304])]; tensor var_686_end_mask_0 = const()[name = tensor("op_686_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_686_cast_fp16 = slice_by_index(begin = var_686_begin_0, end = var_686_end_0, end_mask = var_686_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_686_cast_fp16")]; tensor var_690_begin_0 = const()[name = tensor("op_690_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_690_end_0 = const()[name = tensor("op_690_end_0"), val = tensor([2, 128, 1, 2304])]; tensor var_690_end_mask_0 = const()[name = tensor("op_690_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_690_cast_fp16 = slice_by_index(begin = var_690_begin_0, end = var_690_end_0, end_mask = var_690_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_690_cast_fp16")]; tensor var_694_begin_0 = const()[name = tensor("op_694_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_694_end_0 = const()[name = tensor("op_694_end_0"), val = tensor([2, 192, 1, 2304])]; tensor var_694_end_mask_0 = const()[name = tensor("op_694_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_694_cast_fp16 = slice_by_index(begin = var_694_begin_0, end = var_694_end_0, end_mask = var_694_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_694_cast_fp16")]; tensor var_698_begin_0 = const()[name = tensor("op_698_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_698_end_0 = const()[name = tensor("op_698_end_0"), val = tensor([2, 256, 1, 2304])]; tensor var_698_end_mask_0 = const()[name = tensor("op_698_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_698_cast_fp16 = slice_by_index(begin = var_698_begin_0, end = var_698_end_0, end_mask = var_698_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_698_cast_fp16")]; tensor var_702_begin_0 = const()[name = tensor("op_702_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_702_end_0 = const()[name = tensor("op_702_end_0"), val = tensor([2, 320, 1, 2304])]; tensor var_702_end_mask_0 = const()[name = tensor("op_702_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_702_cast_fp16 = slice_by_index(begin = var_702_begin_0, end = var_702_end_0, end_mask = var_702_end_mask_0, x = v_5_cast_fp16)[name = tensor("op_702_cast_fp16")]; tensor var_706_equation_0 = const()[name = tensor("op_706_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_706_cast_fp16 = einsum(equation = var_706_equation_0, values = (var_668_cast_fp16, var_645_cast_fp16))[name = tensor("op_706_cast_fp16")]; tensor var_707_to_fp16 = const()[name = tensor("op_707_to_fp16"), val = tensor(0x1p-3)]; tensor aw_21_cast_fp16 = mul(x = var_706_cast_fp16, y = var_707_to_fp16)[name = tensor("aw_21_cast_fp16")]; tensor var_710_equation_0 = const()[name = tensor("op_710_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_710_cast_fp16 = einsum(equation = var_710_equation_0, values = (var_672_cast_fp16, var_649_cast_fp16))[name = tensor("op_710_cast_fp16")]; tensor var_711_to_fp16 = const()[name = tensor("op_711_to_fp16"), val = tensor(0x1p-3)]; tensor aw_23_cast_fp16 = mul(x = var_710_cast_fp16, y = var_711_to_fp16)[name = tensor("aw_23_cast_fp16")]; tensor var_714_equation_0 = const()[name = tensor("op_714_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_714_cast_fp16 = einsum(equation = var_714_equation_0, values = (var_676_cast_fp16, var_653_cast_fp16))[name = tensor("op_714_cast_fp16")]; tensor var_715_to_fp16 = const()[name = tensor("op_715_to_fp16"), val = tensor(0x1p-3)]; tensor aw_25_cast_fp16 = mul(x = var_714_cast_fp16, y = var_715_to_fp16)[name = tensor("aw_25_cast_fp16")]; tensor var_718_equation_0 = const()[name = tensor("op_718_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_718_cast_fp16 = einsum(equation = var_718_equation_0, values = (var_680_cast_fp16, var_657_cast_fp16))[name = tensor("op_718_cast_fp16")]; tensor var_719_to_fp16 = const()[name = tensor("op_719_to_fp16"), val = tensor(0x1p-3)]; tensor aw_27_cast_fp16 = mul(x = var_718_cast_fp16, y = var_719_to_fp16)[name = tensor("aw_27_cast_fp16")]; tensor var_722_equation_0 = const()[name = tensor("op_722_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_722_cast_fp16 = einsum(equation = var_722_equation_0, values = (var_684_cast_fp16, var_661_cast_fp16))[name = tensor("op_722_cast_fp16")]; tensor var_723_to_fp16 = const()[name = tensor("op_723_to_fp16"), val = tensor(0x1p-3)]; tensor aw_29_cast_fp16 = mul(x = var_722_cast_fp16, y = var_723_to_fp16)[name = tensor("aw_29_cast_fp16")]; tensor var_725_cast_fp16 = softmax(axis = var_112, x = aw_21_cast_fp16)[name = tensor("op_725_cast_fp16")]; tensor var_726_cast_fp16 = softmax(axis = var_112, x = aw_23_cast_fp16)[name = tensor("op_726_cast_fp16")]; tensor var_727_cast_fp16 = softmax(axis = var_112, x = aw_25_cast_fp16)[name = tensor("op_727_cast_fp16")]; tensor var_728_cast_fp16 = softmax(axis = var_112, x = aw_27_cast_fp16)[name = tensor("op_728_cast_fp16")]; tensor var_729_cast_fp16 = softmax(axis = var_112, x = aw_29_cast_fp16)[name = tensor("op_729_cast_fp16")]; tensor var_731_equation_0 = const()[name = tensor("op_731_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_731_cast_fp16 = einsum(equation = var_731_equation_0, values = (var_686_cast_fp16, var_725_cast_fp16))[name = tensor("op_731_cast_fp16")]; tensor var_733_equation_0 = const()[name = tensor("op_733_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_733_cast_fp16 = einsum(equation = var_733_equation_0, values = (var_690_cast_fp16, var_726_cast_fp16))[name = tensor("op_733_cast_fp16")]; tensor var_735_equation_0 = const()[name = tensor("op_735_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_735_cast_fp16 = einsum(equation = var_735_equation_0, values = (var_694_cast_fp16, var_727_cast_fp16))[name = tensor("op_735_cast_fp16")]; tensor var_737_equation_0 = const()[name = tensor("op_737_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_737_cast_fp16 = einsum(equation = var_737_equation_0, values = (var_698_cast_fp16, var_728_cast_fp16))[name = tensor("op_737_cast_fp16")]; tensor var_739_equation_0 = const()[name = tensor("op_739_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_739_cast_fp16 = einsum(equation = var_739_equation_0, values = (var_702_cast_fp16, var_729_cast_fp16))[name = tensor("op_739_cast_fp16")]; tensor input_51_interleave_0 = const()[name = tensor("input_51_interleave_0"), val = tensor(false)]; tensor input_51_cast_fp16 = concat(axis = var_112, interleave = input_51_interleave_0, values = (var_731_cast_fp16, var_733_cast_fp16, var_735_cast_fp16, var_737_cast_fp16, var_739_cast_fp16))[name = tensor("input_51_cast_fp16")]; tensor var_745 = const()[name = tensor("op_745"), val = tensor([1, 1])]; tensor var_747 = const()[name = tensor("op_747"), val = tensor([1, 1])]; tensor var_749_pad_type_0 = const()[name = tensor("op_749_pad_type_0"), val = tensor("custom")]; tensor var_749_pad_0 = const()[name = tensor("op_749_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19393280)))]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19598144)))]; tensor var_749_cast_fp16 = conv(bias = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_747, groups = var_112, pad = var_749_pad_0, pad_type = var_749_pad_type_0, strides = var_745, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_51_cast_fp16)[name = tensor("op_749_cast_fp16")]; tensor inputs_9_cast_fp16 = add(x = var_749_cast_fp16, y = inputs_7_cast_fp16)[name = tensor("inputs_9_cast_fp16")]; tensor var_753 = const()[name = tensor("op_753"), val = tensor([1])]; tensor channels_mean_9_cast_fp16 = reduce_mean(axes = var_753, keep_dims = var_107, x = inputs_9_cast_fp16)[name = tensor("channels_mean_9_cast_fp16")]; tensor zero_mean_9_cast_fp16 = sub(x = inputs_9_cast_fp16, y = channels_mean_9_cast_fp16)[name = tensor("zero_mean_9_cast_fp16")]; tensor zero_mean_sq_9_cast_fp16 = mul(x = zero_mean_9_cast_fp16, y = zero_mean_9_cast_fp16)[name = tensor("zero_mean_sq_9_cast_fp16")]; tensor var_757 = const()[name = tensor("op_757"), val = tensor([1])]; tensor var_758_cast_fp16 = reduce_mean(axes = var_757, keep_dims = var_107, x = zero_mean_sq_9_cast_fp16)[name = tensor("op_758_cast_fp16")]; tensor var_759_to_fp16 = const()[name = tensor("op_759_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_760_cast_fp16 = add(x = var_758_cast_fp16, y = var_759_to_fp16)[name = tensor("op_760_cast_fp16")]; tensor denom_9_epsilon_0_to_fp16 = const()[name = tensor("denom_9_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_9_cast_fp16 = rsqrt(epsilon = denom_9_epsilon_0_to_fp16, x = var_760_cast_fp16)[name = tensor("denom_9_cast_fp16")]; tensor out_9_cast_fp16 = mul(x = zero_mean_9_cast_fp16, y = denom_9_cast_fp16)[name = tensor("out_9_cast_fp16")]; tensor var_764_to_fp16 = const()[name = tensor("op_764_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19598848)))]; tensor var_765_cast_fp16 = add(x = out_9_cast_fp16, y = var_764_to_fp16)[name = tensor("op_765_cast_fp16")]; tensor var_767_to_fp16 = const()[name = tensor("op_767_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19599552)))]; tensor hidden_states_29_cast_fp16 = mul(x = var_765_cast_fp16, y = var_767_to_fp16)[name = tensor("hidden_states_29_cast_fp16")]; tensor var_774 = const()[name = tensor("op_774"), val = tensor([1, 1])]; tensor var_776 = const()[name = tensor("op_776"), val = tensor([1, 1])]; tensor q_7_pad_type_0 = const()[name = tensor("q_7_pad_type_0"), val = tensor("custom")]; tensor q_7_pad_0 = const()[name = tensor("q_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19600256)))]; tensor q_7_cast_fp16 = conv(dilations = var_776, groups = var_112, pad = q_7_pad_0, pad_type = q_7_pad_type_0, strides = var_774, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_29_cast_fp16)[name = tensor("q_7_cast_fp16")]; tensor var_780 = const()[name = tensor("op_780"), val = tensor([1, 1])]; tensor var_782 = const()[name = tensor("op_782"), val = tensor([1, 1])]; tensor k_13_pad_type_0 = const()[name = tensor("k_13_pad_type_0"), val = tensor("custom")]; tensor k_13_pad_0 = const()[name = tensor("k_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(19805120)))]; tensor k_13_cast_fp16 = conv(dilations = var_782, groups = var_112, pad = k_13_pad_0, pad_type = k_13_pad_type_0, strides = var_780, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_13_cast_fp16")]; tensor var_786 = const()[name = tensor("op_786"), val = tensor([1, 1])]; tensor var_788 = const()[name = tensor("op_788"), val = tensor([1, 1])]; tensor v_7_pad_type_0 = const()[name = tensor("v_7_pad_type_0"), val = tensor("custom")]; tensor v_7_pad_0 = const()[name = tensor("v_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20460544)))]; tensor v_7_cast_fp16 = conv(dilations = var_788, groups = var_112, pad = v_7_pad_0, pad_type = v_7_pad_type_0, strides = var_786, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_7_cast_fp16")]; tensor var_792_begin_0 = const()[name = tensor("op_792_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_792_end_0 = const()[name = tensor("op_792_end_0"), val = tensor([2, 64, 1, 2304])]; tensor var_792_end_mask_0 = const()[name = tensor("op_792_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_792_cast_fp16 = slice_by_index(begin = var_792_begin_0, end = var_792_end_0, end_mask = var_792_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_792_cast_fp16")]; tensor var_796_begin_0 = const()[name = tensor("op_796_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_796_end_0 = const()[name = tensor("op_796_end_0"), val = tensor([2, 128, 1, 2304])]; tensor var_796_end_mask_0 = const()[name = tensor("op_796_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_796_cast_fp16 = slice_by_index(begin = var_796_begin_0, end = var_796_end_0, end_mask = var_796_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_796_cast_fp16")]; tensor var_800_begin_0 = const()[name = tensor("op_800_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_800_end_0 = const()[name = tensor("op_800_end_0"), val = tensor([2, 192, 1, 2304])]; tensor var_800_end_mask_0 = const()[name = tensor("op_800_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_800_cast_fp16 = slice_by_index(begin = var_800_begin_0, end = var_800_end_0, end_mask = var_800_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_800_cast_fp16")]; tensor var_804_begin_0 = const()[name = tensor("op_804_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_804_end_0 = const()[name = tensor("op_804_end_0"), val = tensor([2, 256, 1, 2304])]; tensor var_804_end_mask_0 = const()[name = tensor("op_804_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_804_cast_fp16 = slice_by_index(begin = var_804_begin_0, end = var_804_end_0, end_mask = var_804_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_804_cast_fp16")]; tensor var_808_begin_0 = const()[name = tensor("op_808_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_808_end_0 = const()[name = tensor("op_808_end_0"), val = tensor([2, 320, 1, 2304])]; tensor var_808_end_mask_0 = const()[name = tensor("op_808_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_808_cast_fp16 = slice_by_index(begin = var_808_begin_0, end = var_808_end_0, end_mask = var_808_end_mask_0, x = q_7_cast_fp16)[name = tensor("op_808_cast_fp16")]; tensor k_15_perm_0 = const()[name = tensor("k_15_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_815_begin_0 = const()[name = tensor("op_815_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_815_end_0 = const()[name = tensor("op_815_end_0"), val = tensor([2, 77, 1, 64])]; tensor var_815_end_mask_0 = const()[name = tensor("op_815_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_10 = transpose(perm = k_15_perm_0, x = k_13_cast_fp16)[name = tensor("transpose_10")]; tensor var_815_cast_fp16 = slice_by_index(begin = var_815_begin_0, end = var_815_end_0, end_mask = var_815_end_mask_0, x = transpose_10)[name = tensor("op_815_cast_fp16")]; tensor var_819_begin_0 = const()[name = tensor("op_819_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_819_end_0 = const()[name = tensor("op_819_end_0"), val = tensor([2, 77, 1, 128])]; tensor var_819_end_mask_0 = const()[name = tensor("op_819_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_819_cast_fp16 = slice_by_index(begin = var_819_begin_0, end = var_819_end_0, end_mask = var_819_end_mask_0, x = transpose_10)[name = tensor("op_819_cast_fp16")]; tensor var_823_begin_0 = const()[name = tensor("op_823_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_823_end_0 = const()[name = tensor("op_823_end_0"), val = tensor([2, 77, 1, 192])]; tensor var_823_end_mask_0 = const()[name = tensor("op_823_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_823_cast_fp16 = slice_by_index(begin = var_823_begin_0, end = var_823_end_0, end_mask = var_823_end_mask_0, x = transpose_10)[name = tensor("op_823_cast_fp16")]; tensor var_827_begin_0 = const()[name = tensor("op_827_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_827_end_0 = const()[name = tensor("op_827_end_0"), val = tensor([2, 77, 1, 256])]; tensor var_827_end_mask_0 = const()[name = tensor("op_827_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_827_cast_fp16 = slice_by_index(begin = var_827_begin_0, end = var_827_end_0, end_mask = var_827_end_mask_0, x = transpose_10)[name = tensor("op_827_cast_fp16")]; tensor var_831_begin_0 = const()[name = tensor("op_831_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_831_end_0 = const()[name = tensor("op_831_end_0"), val = tensor([2, 77, 1, 320])]; tensor var_831_end_mask_0 = const()[name = tensor("op_831_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_831_cast_fp16 = slice_by_index(begin = var_831_begin_0, end = var_831_end_0, end_mask = var_831_end_mask_0, x = transpose_10)[name = tensor("op_831_cast_fp16")]; tensor var_833_begin_0 = const()[name = tensor("op_833_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_833_end_0 = const()[name = tensor("op_833_end_0"), val = tensor([2, 64, 1, 77])]; tensor var_833_end_mask_0 = const()[name = tensor("op_833_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_833_cast_fp16 = slice_by_index(begin = var_833_begin_0, end = var_833_end_0, end_mask = var_833_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_833_cast_fp16")]; tensor var_837_begin_0 = const()[name = tensor("op_837_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_837_end_0 = const()[name = tensor("op_837_end_0"), val = tensor([2, 128, 1, 77])]; tensor var_837_end_mask_0 = const()[name = tensor("op_837_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_837_cast_fp16 = slice_by_index(begin = var_837_begin_0, end = var_837_end_0, end_mask = var_837_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_837_cast_fp16")]; tensor var_841_begin_0 = const()[name = tensor("op_841_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_841_end_0 = const()[name = tensor("op_841_end_0"), val = tensor([2, 192, 1, 77])]; tensor var_841_end_mask_0 = const()[name = tensor("op_841_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_841_cast_fp16 = slice_by_index(begin = var_841_begin_0, end = var_841_end_0, end_mask = var_841_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_841_cast_fp16")]; tensor var_845_begin_0 = const()[name = tensor("op_845_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_845_end_0 = const()[name = tensor("op_845_end_0"), val = tensor([2, 256, 1, 77])]; tensor var_845_end_mask_0 = const()[name = tensor("op_845_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_845_cast_fp16 = slice_by_index(begin = var_845_begin_0, end = var_845_end_0, end_mask = var_845_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_845_cast_fp16")]; tensor var_849_begin_0 = const()[name = tensor("op_849_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_849_end_0 = const()[name = tensor("op_849_end_0"), val = tensor([2, 320, 1, 77])]; tensor var_849_end_mask_0 = const()[name = tensor("op_849_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_849_cast_fp16 = slice_by_index(begin = var_849_begin_0, end = var_849_end_0, end_mask = var_849_end_mask_0, x = v_7_cast_fp16)[name = tensor("op_849_cast_fp16")]; tensor var_853_equation_0 = const()[name = tensor("op_853_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_853_cast_fp16 = einsum(equation = var_853_equation_0, values = (var_815_cast_fp16, var_792_cast_fp16))[name = tensor("op_853_cast_fp16")]; tensor var_854_to_fp16 = const()[name = tensor("op_854_to_fp16"), val = tensor(0x1p-3)]; tensor aw_31_cast_fp16 = mul(x = var_853_cast_fp16, y = var_854_to_fp16)[name = tensor("aw_31_cast_fp16")]; tensor var_857_equation_0 = const()[name = tensor("op_857_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_857_cast_fp16 = einsum(equation = var_857_equation_0, values = (var_819_cast_fp16, var_796_cast_fp16))[name = tensor("op_857_cast_fp16")]; tensor var_858_to_fp16 = const()[name = tensor("op_858_to_fp16"), val = tensor(0x1p-3)]; tensor aw_33_cast_fp16 = mul(x = var_857_cast_fp16, y = var_858_to_fp16)[name = tensor("aw_33_cast_fp16")]; tensor var_861_equation_0 = const()[name = tensor("op_861_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_861_cast_fp16 = einsum(equation = var_861_equation_0, values = (var_823_cast_fp16, var_800_cast_fp16))[name = tensor("op_861_cast_fp16")]; tensor var_862_to_fp16 = const()[name = tensor("op_862_to_fp16"), val = tensor(0x1p-3)]; tensor aw_35_cast_fp16 = mul(x = var_861_cast_fp16, y = var_862_to_fp16)[name = tensor("aw_35_cast_fp16")]; tensor var_865_equation_0 = const()[name = tensor("op_865_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_865_cast_fp16 = einsum(equation = var_865_equation_0, values = (var_827_cast_fp16, var_804_cast_fp16))[name = tensor("op_865_cast_fp16")]; tensor var_866_to_fp16 = const()[name = tensor("op_866_to_fp16"), val = tensor(0x1p-3)]; tensor aw_37_cast_fp16 = mul(x = var_865_cast_fp16, y = var_866_to_fp16)[name = tensor("aw_37_cast_fp16")]; tensor var_869_equation_0 = const()[name = tensor("op_869_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_869_cast_fp16 = einsum(equation = var_869_equation_0, values = (var_831_cast_fp16, var_808_cast_fp16))[name = tensor("op_869_cast_fp16")]; tensor var_870_to_fp16 = const()[name = tensor("op_870_to_fp16"), val = tensor(0x1p-3)]; tensor aw_39_cast_fp16 = mul(x = var_869_cast_fp16, y = var_870_to_fp16)[name = tensor("aw_39_cast_fp16")]; tensor var_872_cast_fp16 = softmax(axis = var_112, x = aw_31_cast_fp16)[name = tensor("op_872_cast_fp16")]; tensor var_873_cast_fp16 = softmax(axis = var_112, x = aw_33_cast_fp16)[name = tensor("op_873_cast_fp16")]; tensor var_874_cast_fp16 = softmax(axis = var_112, x = aw_35_cast_fp16)[name = tensor("op_874_cast_fp16")]; tensor var_875_cast_fp16 = softmax(axis = var_112, x = aw_37_cast_fp16)[name = tensor("op_875_cast_fp16")]; tensor var_876_cast_fp16 = softmax(axis = var_112, x = aw_39_cast_fp16)[name = tensor("op_876_cast_fp16")]; tensor var_878_equation_0 = const()[name = tensor("op_878_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_878_cast_fp16 = einsum(equation = var_878_equation_0, values = (var_833_cast_fp16, var_872_cast_fp16))[name = tensor("op_878_cast_fp16")]; tensor var_880_equation_0 = const()[name = tensor("op_880_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_880_cast_fp16 = einsum(equation = var_880_equation_0, values = (var_837_cast_fp16, var_873_cast_fp16))[name = tensor("op_880_cast_fp16")]; tensor var_882_equation_0 = const()[name = tensor("op_882_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_882_cast_fp16 = einsum(equation = var_882_equation_0, values = (var_841_cast_fp16, var_874_cast_fp16))[name = tensor("op_882_cast_fp16")]; tensor var_884_equation_0 = const()[name = tensor("op_884_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_884_cast_fp16 = einsum(equation = var_884_equation_0, values = (var_845_cast_fp16, var_875_cast_fp16))[name = tensor("op_884_cast_fp16")]; tensor var_886_equation_0 = const()[name = tensor("op_886_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_886_cast_fp16 = einsum(equation = var_886_equation_0, values = (var_849_cast_fp16, var_876_cast_fp16))[name = tensor("op_886_cast_fp16")]; tensor input_53_interleave_0 = const()[name = tensor("input_53_interleave_0"), val = tensor(false)]; tensor input_53_cast_fp16 = concat(axis = var_112, interleave = input_53_interleave_0, values = (var_878_cast_fp16, var_880_cast_fp16, var_882_cast_fp16, var_884_cast_fp16, var_886_cast_fp16))[name = tensor("input_53_cast_fp16")]; tensor var_892 = const()[name = tensor("op_892"), val = tensor([1, 1])]; tensor var_894 = const()[name = tensor("op_894"), val = tensor([1, 1])]; tensor var_896_pad_type_0 = const()[name = tensor("op_896_pad_type_0"), val = tensor("custom")]; tensor var_896_pad_0 = const()[name = tensor("op_896_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21115968)))]; tensor down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21320832)))]; tensor var_896_cast_fp16 = conv(bias = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_894, groups = var_112, pad = var_896_pad_0, pad_type = var_896_pad_type_0, strides = var_892, weight = down_blocks_0_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_53_cast_fp16)[name = tensor("op_896_cast_fp16")]; tensor inputs_11_cast_fp16 = add(x = var_896_cast_fp16, y = inputs_9_cast_fp16)[name = tensor("inputs_11_cast_fp16")]; tensor var_900 = const()[name = tensor("op_900"), val = tensor([1])]; tensor channels_mean_11_cast_fp16 = reduce_mean(axes = var_900, keep_dims = var_107, x = inputs_11_cast_fp16)[name = tensor("channels_mean_11_cast_fp16")]; tensor zero_mean_11_cast_fp16 = sub(x = inputs_11_cast_fp16, y = channels_mean_11_cast_fp16)[name = tensor("zero_mean_11_cast_fp16")]; tensor zero_mean_sq_11_cast_fp16 = mul(x = zero_mean_11_cast_fp16, y = zero_mean_11_cast_fp16)[name = tensor("zero_mean_sq_11_cast_fp16")]; tensor var_904 = const()[name = tensor("op_904"), val = tensor([1])]; tensor var_905_cast_fp16 = reduce_mean(axes = var_904, keep_dims = var_107, x = zero_mean_sq_11_cast_fp16)[name = tensor("op_905_cast_fp16")]; tensor var_906_to_fp16 = const()[name = tensor("op_906_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_907_cast_fp16 = add(x = var_905_cast_fp16, y = var_906_to_fp16)[name = tensor("op_907_cast_fp16")]; tensor denom_11_epsilon_0_to_fp16 = const()[name = tensor("denom_11_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_11_cast_fp16 = rsqrt(epsilon = denom_11_epsilon_0_to_fp16, x = var_907_cast_fp16)[name = tensor("denom_11_cast_fp16")]; tensor out_11_cast_fp16 = mul(x = zero_mean_11_cast_fp16, y = denom_11_cast_fp16)[name = tensor("out_11_cast_fp16")]; tensor var_911_to_fp16 = const()[name = tensor("op_911_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21321536)))]; tensor var_912_cast_fp16 = add(x = out_11_cast_fp16, y = var_911_to_fp16)[name = tensor("op_912_cast_fp16")]; tensor var_914_to_fp16 = const()[name = tensor("op_914_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21322240)))]; tensor input_55_cast_fp16 = mul(x = var_912_cast_fp16, y = var_914_to_fp16)[name = tensor("input_55_cast_fp16")]; tensor var_922 = const()[name = tensor("op_922"), val = tensor([1, 1])]; tensor var_924 = const()[name = tensor("op_924"), val = tensor([1, 1])]; tensor var_926_pad_type_0 = const()[name = tensor("op_926_pad_type_0"), val = tensor("custom")]; tensor var_926_pad_0 = const()[name = tensor("op_926_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(21322944)))]; tensor down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22961408)))]; tensor var_926_cast_fp16 = conv(bias = down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_924, groups = var_112, pad = var_926_pad_0, pad_type = var_926_pad_type_0, strides = var_922, weight = down_blocks_0_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_55_cast_fp16)[name = tensor("op_926_cast_fp16")]; tensor var_927_split_sizes_0 = const()[name = tensor("op_927_split_sizes_0"), val = tensor([1280, 1280])]; tensor var_927_axis_0 = const()[name = tensor("op_927_axis_0"), val = tensor(1)]; tensor var_927_cast_fp16_0, tensor var_927_cast_fp16_1 = split(axis = var_927_axis_0, split_sizes = var_927_split_sizes_0, x = var_926_cast_fp16)[name = tensor("op_927_cast_fp16")]; tensor var_929_mode_0 = const()[name = tensor("op_929_mode_0"), val = tensor("EXACT")]; tensor var_929_cast_fp16 = gelu(mode = var_929_mode_0, x = var_927_cast_fp16_1)[name = tensor("op_929_cast_fp16")]; tensor input_57_cast_fp16 = mul(x = var_927_cast_fp16_0, y = var_929_cast_fp16)[name = tensor("input_57_cast_fp16")]; tensor var_933 = const()[name = tensor("op_933"), val = tensor([1, 1])]; tensor var_935 = const()[name = tensor("op_935"), val = tensor([1, 1])]; tensor var_937_pad_type_0 = const()[name = tensor("op_937_pad_type_0"), val = tensor("custom")]; tensor var_937_pad_0 = const()[name = tensor("op_937_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22966592)))]; tensor down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23785856)))]; tensor var_937_cast_fp16 = conv(bias = down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_935, groups = var_112, pad = var_937_pad_0, pad_type = var_937_pad_type_0, strides = var_933, weight = down_blocks_0_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_57_cast_fp16)[name = tensor("op_937_cast_fp16")]; tensor hidden_states_33_cast_fp16 = add(x = var_937_cast_fp16, y = inputs_11_cast_fp16)[name = tensor("hidden_states_33_cast_fp16")]; tensor var_939 = const()[name = tensor("op_939"), val = tensor([2, 320, 48, 48])]; tensor input_59_cast_fp16 = reshape(shape = var_939, x = hidden_states_33_cast_fp16)[name = tensor("input_59_cast_fp16")]; tensor var_943 = const()[name = tensor("op_943"), val = tensor([1, 1])]; tensor var_945 = const()[name = tensor("op_945"), val = tensor([1, 1])]; tensor hidden_states_35_pad_type_0 = const()[name = tensor("hidden_states_35_pad_type_0"), val = tensor("custom")]; tensor hidden_states_35_pad_0 = const()[name = tensor("hidden_states_35_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_0_attentions_1_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23786560)))]; tensor down_blocks_0_attentions_1_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_0_attentions_1_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23991424)))]; tensor hidden_states_35_cast_fp16 = conv(bias = down_blocks_0_attentions_1_proj_out_bias_to_fp16, dilations = var_945, groups = var_112, pad = hidden_states_35_pad_0, pad_type = hidden_states_35_pad_type_0, strides = var_943, weight = down_blocks_0_attentions_1_proj_out_weight_to_fp16, x = input_59_cast_fp16)[name = tensor("hidden_states_35_cast_fp16")]; tensor input_61_cast_fp16_1 = add(x = hidden_states_35_cast_fp16, y = hidden_states_23_cast_fp16)[name = tensor("input_61_cast_fp16")]; tensor var_952 = const()[name = tensor("op_952"), val = tensor([2, 2])]; tensor var_954 = const()[name = tensor("op_954"), val = tensor([1, 1])]; tensor input_63_pad_type_0 = const()[name = tensor("input_63_pad_type_0"), val = tensor("custom")]; tensor input_63_pad_0 = const()[name = tensor("input_63_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_0_downsamplers_0_conv_weight_to_fp16 = const()[name = tensor("down_blocks_0_downsamplers_0_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23992128)))]; tensor down_blocks_0_downsamplers_0_conv_bias_to_fp16 = const()[name = tensor("down_blocks_0_downsamplers_0_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25835392)))]; tensor input_63_cast_fp16_1 = conv(bias = down_blocks_0_downsamplers_0_conv_bias_to_fp16, dilations = var_954, groups = var_112, pad = input_63_pad_0, pad_type = input_63_pad_type_0, strides = var_952, weight = down_blocks_0_downsamplers_0_conv_weight_to_fp16, x = input_61_cast_fp16_1)[name = tensor("input_63_cast_fp16")]; tensor var_979 = const()[name = tensor("op_979"), val = tensor(true)]; tensor var_984 = const()[name = tensor("op_984"), val = tensor(1)]; tensor reshape_24_shape_0 = const()[name = tensor("reshape_24_shape_0"), val = tensor([2, 32, 10, 24, 24])]; tensor reshape_24_cast_fp16 = reshape(shape = reshape_24_shape_0, x = input_63_cast_fp16_1)[name = tensor("reshape_24_cast_fp16")]; tensor reduce_mean_18_axes_0 = const()[name = tensor("reduce_mean_18_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_18_keep_dims_0 = const()[name = tensor("reduce_mean_18_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_18_cast_fp16 = reduce_mean(axes = reduce_mean_18_axes_0, keep_dims = reduce_mean_18_keep_dims_0, x = reshape_24_cast_fp16)[name = tensor("reduce_mean_18_cast_fp16")]; tensor sub_12_cast_fp16 = sub(x = reshape_24_cast_fp16, y = reduce_mean_18_cast_fp16)[name = tensor("sub_12_cast_fp16")]; tensor square_6_cast_fp16 = square(x = sub_12_cast_fp16)[name = tensor("square_6_cast_fp16")]; tensor reduce_mean_20_axes_0 = const()[name = tensor("reduce_mean_20_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_20_keep_dims_0 = const()[name = tensor("reduce_mean_20_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_20_cast_fp16 = reduce_mean(axes = reduce_mean_20_axes_0, keep_dims = reduce_mean_20_keep_dims_0, x = square_6_cast_fp16)[name = tensor("reduce_mean_20_cast_fp16")]; tensor add_12_y_0_to_fp16 = const()[name = tensor("add_12_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_12_cast_fp16 = add(x = reduce_mean_20_cast_fp16, y = add_12_y_0_to_fp16)[name = tensor("add_12_cast_fp16")]; tensor sqrt_6_cast_fp16 = sqrt(x = add_12_cast_fp16)[name = tensor("sqrt_6_cast_fp16")]; tensor real_div_6_cast_fp16 = real_div(x = sub_12_cast_fp16, y = sqrt_6_cast_fp16)[name = tensor("real_div_6_cast_fp16")]; tensor reshape_25_shape_0 = const()[name = tensor("reshape_25_shape_0"), val = tensor([2, 320, 24, 24])]; tensor reshape_25_cast_fp16 = reshape(shape = reshape_25_shape_0, x = real_div_6_cast_fp16)[name = tensor("reshape_25_cast_fp16")]; tensor add_13_gamma_0_to_fp16 = const()[name = tensor("add_13_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25836096)))]; tensor add_13_beta_0_to_fp16 = const()[name = tensor("add_13_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25836800)))]; tensor add_13_epsilon_0_to_fp16 = const()[name = tensor("add_13_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_13_cast_fp16 = batch_norm(beta = add_13_beta_0_to_fp16, epsilon = add_13_epsilon_0_to_fp16, gamma = add_13_gamma_0_to_fp16, mean = add_1_mean_0_to_fp16, variance = add_1_variance_0_to_fp16, x = reshape_25_cast_fp16)[name = tensor("add_13_cast_fp16")]; tensor input_67_cast_fp16 = silu(x = add_13_cast_fp16)[name = tensor("input_67_cast_fp16")]; tensor var_1007 = const()[name = tensor("op_1007"), val = tensor([1, 1])]; tensor var_1009 = const()[name = tensor("op_1009"), val = tensor([1, 1])]; tensor hidden_states_37_pad_type_0 = const()[name = tensor("hidden_states_37_pad_type_0"), val = tensor("custom")]; tensor hidden_states_37_pad_0 = const()[name = tensor("hidden_states_37_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_1_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(25837504)))]; tensor down_blocks_1_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29523968)))]; tensor hidden_states_37_cast_fp16 = conv(bias = down_blocks_1_resnets_0_conv1_bias_to_fp16, dilations = var_1009, groups = var_984, pad = hidden_states_37_pad_0, pad_type = hidden_states_37_pad_type_0, strides = var_1007, weight = down_blocks_1_resnets_0_conv1_weight_to_fp16, x = input_67_cast_fp16)[name = tensor("hidden_states_37_cast_fp16")]; tensor var_1015 = const()[name = tensor("op_1015"), val = tensor([1, 1])]; tensor var_1017 = const()[name = tensor("op_1017"), val = tensor([1, 1])]; tensor temb_5_pad_type_0 = const()[name = tensor("temb_5_pad_type_0"), val = tensor("custom")]; tensor temb_5_pad_0 = const()[name = tensor("temb_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29525312)))]; tensor down_blocks_1_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31163776)))]; tensor temb_5_cast_fp16 = conv(bias = down_blocks_1_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_1017, groups = var_984, pad = temb_5_pad_0, pad_type = temb_5_pad_type_0, strides = var_1015, weight = down_blocks_1_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_5_cast_fp16")]; tensor input_71_cast_fp16 = add(x = hidden_states_37_cast_fp16, y = temb_5_cast_fp16)[name = tensor("input_71_cast_fp16")]; tensor reshape_28_shape_0 = const()[name = tensor("reshape_28_shape_0"), val = tensor([2, 32, 20, 24, 24])]; tensor reshape_28_cast_fp16 = reshape(shape = reshape_28_shape_0, x = input_71_cast_fp16)[name = tensor("reshape_28_cast_fp16")]; tensor reduce_mean_21_axes_0 = const()[name = tensor("reduce_mean_21_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_21_keep_dims_0 = const()[name = tensor("reduce_mean_21_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_21_cast_fp16 = reduce_mean(axes = reduce_mean_21_axes_0, keep_dims = reduce_mean_21_keep_dims_0, x = reshape_28_cast_fp16)[name = tensor("reduce_mean_21_cast_fp16")]; tensor sub_14_cast_fp16 = sub(x = reshape_28_cast_fp16, y = reduce_mean_21_cast_fp16)[name = tensor("sub_14_cast_fp16")]; tensor square_7_cast_fp16 = square(x = sub_14_cast_fp16)[name = tensor("square_7_cast_fp16")]; tensor reduce_mean_23_axes_0 = const()[name = tensor("reduce_mean_23_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_23_keep_dims_0 = const()[name = tensor("reduce_mean_23_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_23_cast_fp16 = reduce_mean(axes = reduce_mean_23_axes_0, keep_dims = reduce_mean_23_keep_dims_0, x = square_7_cast_fp16)[name = tensor("reduce_mean_23_cast_fp16")]; tensor add_14_y_0_to_fp16 = const()[name = tensor("add_14_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_14_cast_fp16 = add(x = reduce_mean_23_cast_fp16, y = add_14_y_0_to_fp16)[name = tensor("add_14_cast_fp16")]; tensor sqrt_7_cast_fp16 = sqrt(x = add_14_cast_fp16)[name = tensor("sqrt_7_cast_fp16")]; tensor real_div_7_cast_fp16 = real_div(x = sub_14_cast_fp16, y = sqrt_7_cast_fp16)[name = tensor("real_div_7_cast_fp16")]; tensor reshape_29_shape_0 = const()[name = tensor("reshape_29_shape_0"), val = tensor([2, 640, 24, 24])]; tensor reshape_29_cast_fp16 = reshape(shape = reshape_29_shape_0, x = real_div_7_cast_fp16)[name = tensor("reshape_29_cast_fp16")]; tensor add_15_mean_0_to_fp16 = const()[name = tensor("add_15_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31165120)))]; tensor add_15_variance_0_to_fp16 = const()[name = tensor("add_15_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31166464)))]; tensor add_15_gamma_0_to_fp16 = const()[name = tensor("add_15_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31167808)))]; tensor add_15_beta_0_to_fp16 = const()[name = tensor("add_15_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31169152)))]; tensor add_15_epsilon_0_to_fp16 = const()[name = tensor("add_15_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_15_cast_fp16 = batch_norm(beta = add_15_beta_0_to_fp16, epsilon = add_15_epsilon_0_to_fp16, gamma = add_15_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_29_cast_fp16)[name = tensor("add_15_cast_fp16")]; tensor input_75_cast_fp16 = silu(x = add_15_cast_fp16)[name = tensor("input_75_cast_fp16")]; tensor var_1027 = const()[name = tensor("op_1027"), val = tensor([1, 1])]; tensor var_1029 = const()[name = tensor("op_1029"), val = tensor([1, 1])]; tensor hidden_states_39_pad_type_0 = const()[name = tensor("hidden_states_39_pad_type_0"), val = tensor("custom")]; tensor hidden_states_39_pad_0 = const()[name = tensor("hidden_states_39_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_1_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(31170496)))]; tensor down_blocks_1_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38543360)))]; tensor hidden_states_39_cast_fp16 = conv(bias = down_blocks_1_resnets_0_conv2_bias_to_fp16, dilations = var_1029, groups = var_984, pad = hidden_states_39_pad_0, pad_type = hidden_states_39_pad_type_0, strides = var_1027, weight = down_blocks_1_resnets_0_conv2_weight_to_fp16, x = input_75_cast_fp16)[name = tensor("hidden_states_39_cast_fp16")]; tensor var_1034 = const()[name = tensor("op_1034"), val = tensor([1, 1])]; tensor var_1036 = const()[name = tensor("op_1036"), val = tensor([1, 1])]; tensor x_1_pad_type_0 = const()[name = tensor("x_1_pad_type_0"), val = tensor("custom")]; tensor x_1_pad_0 = const()[name = tensor("x_1_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_resnets_0_conv_shortcut_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38544704)))]; tensor down_blocks_1_resnets_0_conv_shortcut_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_0_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38954368)))]; tensor x_1_cast_fp16 = conv(bias = down_blocks_1_resnets_0_conv_shortcut_bias_to_fp16, dilations = var_1036, groups = var_984, pad = x_1_pad_0, pad_type = x_1_pad_type_0, strides = var_1034, weight = down_blocks_1_resnets_0_conv_shortcut_weight_to_fp16, x = input_63_cast_fp16_1)[name = tensor("x_1_cast_fp16")]; tensor hidden_states_41_cast_fp16 = add(x = x_1_cast_fp16, y = hidden_states_39_cast_fp16)[name = tensor("hidden_states_41_cast_fp16")]; tensor reshape_32_shape_0 = const()[name = tensor("reshape_32_shape_0"), val = tensor([2, 32, 20, 24, 24])]; tensor reshape_32_cast_fp16 = reshape(shape = reshape_32_shape_0, x = hidden_states_41_cast_fp16)[name = tensor("reshape_32_cast_fp16")]; tensor reduce_mean_24_axes_0 = const()[name = tensor("reduce_mean_24_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_24_keep_dims_0 = const()[name = tensor("reduce_mean_24_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_24_cast_fp16 = reduce_mean(axes = reduce_mean_24_axes_0, keep_dims = reduce_mean_24_keep_dims_0, x = reshape_32_cast_fp16)[name = tensor("reduce_mean_24_cast_fp16")]; tensor sub_16_cast_fp16 = sub(x = reshape_32_cast_fp16, y = reduce_mean_24_cast_fp16)[name = tensor("sub_16_cast_fp16")]; tensor square_8_cast_fp16 = square(x = sub_16_cast_fp16)[name = tensor("square_8_cast_fp16")]; tensor reduce_mean_26_axes_0 = const()[name = tensor("reduce_mean_26_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_26_keep_dims_0 = const()[name = tensor("reduce_mean_26_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_26_cast_fp16 = reduce_mean(axes = reduce_mean_26_axes_0, keep_dims = reduce_mean_26_keep_dims_0, x = square_8_cast_fp16)[name = tensor("reduce_mean_26_cast_fp16")]; tensor add_16_y_0_to_fp16 = const()[name = tensor("add_16_y_0_to_fp16"), val = tensor(0x1.1p-20)]; tensor add_16_cast_fp16 = add(x = reduce_mean_26_cast_fp16, y = add_16_y_0_to_fp16)[name = tensor("add_16_cast_fp16")]; tensor sqrt_8_cast_fp16 = sqrt(x = add_16_cast_fp16)[name = tensor("sqrt_8_cast_fp16")]; tensor real_div_8_cast_fp16 = real_div(x = sub_16_cast_fp16, y = sqrt_8_cast_fp16)[name = tensor("real_div_8_cast_fp16")]; tensor reshape_33_shape_0 = const()[name = tensor("reshape_33_shape_0"), val = tensor([2, 640, 24, 24])]; tensor reshape_33_cast_fp16 = reshape(shape = reshape_33_shape_0, x = real_div_8_cast_fp16)[name = tensor("reshape_33_cast_fp16")]; tensor add_17_gamma_0_to_fp16 = const()[name = tensor("add_17_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38955712)))]; tensor add_17_beta_0_to_fp16 = const()[name = tensor("add_17_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38957056)))]; tensor add_17_epsilon_0_to_fp16 = const()[name = tensor("add_17_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_17_cast_fp16 = batch_norm(beta = add_17_beta_0_to_fp16, epsilon = add_17_epsilon_0_to_fp16, gamma = add_17_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_33_cast_fp16)[name = tensor("add_17_cast_fp16")]; tensor var_1056 = const()[name = tensor("op_1056"), val = tensor([1, 1])]; tensor var_1058 = const()[name = tensor("op_1058"), val = tensor([1, 1])]; tensor hidden_states_43_pad_type_0 = const()[name = tensor("hidden_states_43_pad_type_0"), val = tensor("custom")]; tensor hidden_states_43_pad_0 = const()[name = tensor("hidden_states_43_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(38958400)))]; tensor down_blocks_1_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39777664)))]; tensor hidden_states_43_cast_fp16 = conv(bias = down_blocks_1_attentions_0_proj_in_bias_to_fp16, dilations = var_1058, groups = var_984, pad = hidden_states_43_pad_0, pad_type = hidden_states_43_pad_type_0, strides = var_1056, weight = down_blocks_1_attentions_0_proj_in_weight_to_fp16, x = add_17_cast_fp16)[name = tensor("hidden_states_43_cast_fp16")]; tensor var_1063 = const()[name = tensor("op_1063"), val = tensor([2, 640, 1, 576])]; tensor inputs_13_cast_fp16 = reshape(shape = var_1063, x = hidden_states_43_cast_fp16)[name = tensor("inputs_13_cast_fp16")]; tensor var_1073 = const()[name = tensor("op_1073"), val = tensor([1])]; tensor channels_mean_13_cast_fp16 = reduce_mean(axes = var_1073, keep_dims = var_979, x = inputs_13_cast_fp16)[name = tensor("channels_mean_13_cast_fp16")]; tensor zero_mean_13_cast_fp16 = sub(x = inputs_13_cast_fp16, y = channels_mean_13_cast_fp16)[name = tensor("zero_mean_13_cast_fp16")]; tensor zero_mean_sq_13_cast_fp16 = mul(x = zero_mean_13_cast_fp16, y = zero_mean_13_cast_fp16)[name = tensor("zero_mean_sq_13_cast_fp16")]; tensor var_1077 = const()[name = tensor("op_1077"), val = tensor([1])]; tensor var_1078_cast_fp16 = reduce_mean(axes = var_1077, keep_dims = var_979, x = zero_mean_sq_13_cast_fp16)[name = tensor("op_1078_cast_fp16")]; tensor var_1079_to_fp16 = const()[name = tensor("op_1079_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1080_cast_fp16 = add(x = var_1078_cast_fp16, y = var_1079_to_fp16)[name = tensor("op_1080_cast_fp16")]; tensor denom_13_epsilon_0_to_fp16 = const()[name = tensor("denom_13_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_13_cast_fp16 = rsqrt(epsilon = denom_13_epsilon_0_to_fp16, x = var_1080_cast_fp16)[name = tensor("denom_13_cast_fp16")]; tensor out_13_cast_fp16 = mul(x = zero_mean_13_cast_fp16, y = denom_13_cast_fp16)[name = tensor("out_13_cast_fp16")]; tensor var_1084_to_fp16 = const()[name = tensor("op_1084_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39779008)))]; tensor var_1085_cast_fp16 = add(x = out_13_cast_fp16, y = var_1084_to_fp16)[name = tensor("op_1085_cast_fp16")]; tensor var_1087_to_fp16 = const()[name = tensor("op_1087_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39780352)))]; tensor hidden_states_45_cast_fp16 = mul(x = var_1085_cast_fp16, y = var_1087_to_fp16)[name = tensor("hidden_states_45_cast_fp16")]; tensor var_1094 = const()[name = tensor("op_1094"), val = tensor([1, 1])]; tensor var_1096 = const()[name = tensor("op_1096"), val = tensor([1, 1])]; tensor q_9_pad_type_0 = const()[name = tensor("q_9_pad_type_0"), val = tensor("custom")]; tensor q_9_pad_0 = const()[name = tensor("q_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39781696)))]; tensor q_9_cast_fp16 = conv(dilations = var_1096, groups = var_984, pad = q_9_pad_0, pad_type = q_9_pad_type_0, strides = var_1094, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_45_cast_fp16)[name = tensor("q_9_cast_fp16")]; tensor var_1100 = const()[name = tensor("op_1100"), val = tensor([1, 1])]; tensor var_1102 = const()[name = tensor("op_1102"), val = tensor([1, 1])]; tensor k_17_pad_type_0 = const()[name = tensor("k_17_pad_type_0"), val = tensor("custom")]; tensor k_17_pad_0 = const()[name = tensor("k_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(40600960)))]; tensor k_17_cast_fp16 = conv(dilations = var_1102, groups = var_984, pad = k_17_pad_0, pad_type = k_17_pad_type_0, strides = var_1100, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_45_cast_fp16)[name = tensor("k_17_cast_fp16")]; tensor var_1106 = const()[name = tensor("op_1106"), val = tensor([1, 1])]; tensor var_1108 = const()[name = tensor("op_1108"), val = tensor([1, 1])]; tensor v_9_pad_type_0 = const()[name = tensor("v_9_pad_type_0"), val = tensor("custom")]; tensor v_9_pad_0 = const()[name = tensor("v_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41420224)))]; tensor v_9_cast_fp16 = conv(dilations = var_1108, groups = var_984, pad = v_9_pad_0, pad_type = v_9_pad_type_0, strides = var_1106, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_45_cast_fp16)[name = tensor("v_9_cast_fp16")]; tensor var_1112_begin_0 = const()[name = tensor("op_1112_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1112_end_0 = const()[name = tensor("op_1112_end_0"), val = tensor([2, 64, 1, 576])]; tensor var_1112_end_mask_0 = const()[name = tensor("op_1112_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1112_cast_fp16 = slice_by_index(begin = var_1112_begin_0, end = var_1112_end_0, end_mask = var_1112_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1112_cast_fp16")]; tensor var_1116_begin_0 = const()[name = tensor("op_1116_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_1116_end_0 = const()[name = tensor("op_1116_end_0"), val = tensor([2, 128, 1, 576])]; tensor var_1116_end_mask_0 = const()[name = tensor("op_1116_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1116_cast_fp16 = slice_by_index(begin = var_1116_begin_0, end = var_1116_end_0, end_mask = var_1116_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1116_cast_fp16")]; tensor var_1120_begin_0 = const()[name = tensor("op_1120_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_1120_end_0 = const()[name = tensor("op_1120_end_0"), val = tensor([2, 192, 1, 576])]; tensor var_1120_end_mask_0 = const()[name = tensor("op_1120_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1120_cast_fp16 = slice_by_index(begin = var_1120_begin_0, end = var_1120_end_0, end_mask = var_1120_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1120_cast_fp16")]; tensor var_1124_begin_0 = const()[name = tensor("op_1124_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_1124_end_0 = const()[name = tensor("op_1124_end_0"), val = tensor([2, 256, 1, 576])]; tensor var_1124_end_mask_0 = const()[name = tensor("op_1124_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1124_cast_fp16 = slice_by_index(begin = var_1124_begin_0, end = var_1124_end_0, end_mask = var_1124_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1124_cast_fp16")]; tensor var_1128_begin_0 = const()[name = tensor("op_1128_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_1128_end_0 = const()[name = tensor("op_1128_end_0"), val = tensor([2, 320, 1, 576])]; tensor var_1128_end_mask_0 = const()[name = tensor("op_1128_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1128_cast_fp16 = slice_by_index(begin = var_1128_begin_0, end = var_1128_end_0, end_mask = var_1128_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1128_cast_fp16")]; tensor var_1132_begin_0 = const()[name = tensor("op_1132_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_1132_end_0 = const()[name = tensor("op_1132_end_0"), val = tensor([2, 384, 1, 576])]; tensor var_1132_end_mask_0 = const()[name = tensor("op_1132_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1132_cast_fp16 = slice_by_index(begin = var_1132_begin_0, end = var_1132_end_0, end_mask = var_1132_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1132_cast_fp16")]; tensor var_1136_begin_0 = const()[name = tensor("op_1136_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_1136_end_0 = const()[name = tensor("op_1136_end_0"), val = tensor([2, 448, 1, 576])]; tensor var_1136_end_mask_0 = const()[name = tensor("op_1136_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1136_cast_fp16 = slice_by_index(begin = var_1136_begin_0, end = var_1136_end_0, end_mask = var_1136_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1136_cast_fp16")]; tensor var_1140_begin_0 = const()[name = tensor("op_1140_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_1140_end_0 = const()[name = tensor("op_1140_end_0"), val = tensor([2, 512, 1, 576])]; tensor var_1140_end_mask_0 = const()[name = tensor("op_1140_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1140_cast_fp16 = slice_by_index(begin = var_1140_begin_0, end = var_1140_end_0, end_mask = var_1140_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1140_cast_fp16")]; tensor var_1144_begin_0 = const()[name = tensor("op_1144_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_1144_end_0 = const()[name = tensor("op_1144_end_0"), val = tensor([2, 576, 1, 576])]; tensor var_1144_end_mask_0 = const()[name = tensor("op_1144_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1144_cast_fp16 = slice_by_index(begin = var_1144_begin_0, end = var_1144_end_0, end_mask = var_1144_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1144_cast_fp16")]; tensor var_1148_begin_0 = const()[name = tensor("op_1148_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_1148_end_0 = const()[name = tensor("op_1148_end_0"), val = tensor([2, 640, 1, 576])]; tensor var_1148_end_mask_0 = const()[name = tensor("op_1148_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1148_cast_fp16 = slice_by_index(begin = var_1148_begin_0, end = var_1148_end_0, end_mask = var_1148_end_mask_0, x = q_9_cast_fp16)[name = tensor("op_1148_cast_fp16")]; tensor k_19_perm_0 = const()[name = tensor("k_19_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_1155_begin_0 = const()[name = tensor("op_1155_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1155_end_0 = const()[name = tensor("op_1155_end_0"), val = tensor([2, 576, 1, 64])]; tensor var_1155_end_mask_0 = const()[name = tensor("op_1155_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_9 = transpose(perm = k_19_perm_0, x = k_17_cast_fp16)[name = tensor("transpose_9")]; tensor var_1155_cast_fp16 = slice_by_index(begin = var_1155_begin_0, end = var_1155_end_0, end_mask = var_1155_end_mask_0, x = transpose_9)[name = tensor("op_1155_cast_fp16")]; tensor var_1159_begin_0 = const()[name = tensor("op_1159_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_1159_end_0 = const()[name = tensor("op_1159_end_0"), val = tensor([2, 576, 1, 128])]; tensor var_1159_end_mask_0 = const()[name = tensor("op_1159_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1159_cast_fp16 = slice_by_index(begin = var_1159_begin_0, end = var_1159_end_0, end_mask = var_1159_end_mask_0, x = transpose_9)[name = tensor("op_1159_cast_fp16")]; tensor var_1163_begin_0 = const()[name = tensor("op_1163_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_1163_end_0 = const()[name = tensor("op_1163_end_0"), val = tensor([2, 576, 1, 192])]; tensor var_1163_end_mask_0 = const()[name = tensor("op_1163_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1163_cast_fp16 = slice_by_index(begin = var_1163_begin_0, end = var_1163_end_0, end_mask = var_1163_end_mask_0, x = transpose_9)[name = tensor("op_1163_cast_fp16")]; tensor var_1167_begin_0 = const()[name = tensor("op_1167_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_1167_end_0 = const()[name = tensor("op_1167_end_0"), val = tensor([2, 576, 1, 256])]; tensor var_1167_end_mask_0 = const()[name = tensor("op_1167_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1167_cast_fp16 = slice_by_index(begin = var_1167_begin_0, end = var_1167_end_0, end_mask = var_1167_end_mask_0, x = transpose_9)[name = tensor("op_1167_cast_fp16")]; tensor var_1171_begin_0 = const()[name = tensor("op_1171_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_1171_end_0 = const()[name = tensor("op_1171_end_0"), val = tensor([2, 576, 1, 320])]; tensor var_1171_end_mask_0 = const()[name = tensor("op_1171_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1171_cast_fp16 = slice_by_index(begin = var_1171_begin_0, end = var_1171_end_0, end_mask = var_1171_end_mask_0, x = transpose_9)[name = tensor("op_1171_cast_fp16")]; tensor var_1175_begin_0 = const()[name = tensor("op_1175_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_1175_end_0 = const()[name = tensor("op_1175_end_0"), val = tensor([2, 576, 1, 384])]; tensor var_1175_end_mask_0 = const()[name = tensor("op_1175_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1175_cast_fp16 = slice_by_index(begin = var_1175_begin_0, end = var_1175_end_0, end_mask = var_1175_end_mask_0, x = transpose_9)[name = tensor("op_1175_cast_fp16")]; tensor var_1179_begin_0 = const()[name = tensor("op_1179_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_1179_end_0 = const()[name = tensor("op_1179_end_0"), val = tensor([2, 576, 1, 448])]; tensor var_1179_end_mask_0 = const()[name = tensor("op_1179_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1179_cast_fp16 = slice_by_index(begin = var_1179_begin_0, end = var_1179_end_0, end_mask = var_1179_end_mask_0, x = transpose_9)[name = tensor("op_1179_cast_fp16")]; tensor var_1183_begin_0 = const()[name = tensor("op_1183_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_1183_end_0 = const()[name = tensor("op_1183_end_0"), val = tensor([2, 576, 1, 512])]; tensor var_1183_end_mask_0 = const()[name = tensor("op_1183_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1183_cast_fp16 = slice_by_index(begin = var_1183_begin_0, end = var_1183_end_0, end_mask = var_1183_end_mask_0, x = transpose_9)[name = tensor("op_1183_cast_fp16")]; tensor var_1187_begin_0 = const()[name = tensor("op_1187_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_1187_end_0 = const()[name = tensor("op_1187_end_0"), val = tensor([2, 576, 1, 576])]; tensor var_1187_end_mask_0 = const()[name = tensor("op_1187_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1187_cast_fp16 = slice_by_index(begin = var_1187_begin_0, end = var_1187_end_0, end_mask = var_1187_end_mask_0, x = transpose_9)[name = tensor("op_1187_cast_fp16")]; tensor var_1191_begin_0 = const()[name = tensor("op_1191_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_1191_end_0 = const()[name = tensor("op_1191_end_0"), val = tensor([2, 576, 1, 640])]; tensor var_1191_end_mask_0 = const()[name = tensor("op_1191_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1191_cast_fp16 = slice_by_index(begin = var_1191_begin_0, end = var_1191_end_0, end_mask = var_1191_end_mask_0, x = transpose_9)[name = tensor("op_1191_cast_fp16")]; tensor var_1193_begin_0 = const()[name = tensor("op_1193_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1193_end_0 = const()[name = tensor("op_1193_end_0"), val = tensor([2, 64, 1, 576])]; tensor var_1193_end_mask_0 = const()[name = tensor("op_1193_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1193_cast_fp16 = slice_by_index(begin = var_1193_begin_0, end = var_1193_end_0, end_mask = var_1193_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1193_cast_fp16")]; tensor var_1197_begin_0 = const()[name = tensor("op_1197_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_1197_end_0 = const()[name = tensor("op_1197_end_0"), val = tensor([2, 128, 1, 576])]; tensor var_1197_end_mask_0 = const()[name = tensor("op_1197_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1197_cast_fp16 = slice_by_index(begin = var_1197_begin_0, end = var_1197_end_0, end_mask = var_1197_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1197_cast_fp16")]; tensor var_1201_begin_0 = const()[name = tensor("op_1201_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_1201_end_0 = const()[name = tensor("op_1201_end_0"), val = tensor([2, 192, 1, 576])]; tensor var_1201_end_mask_0 = const()[name = tensor("op_1201_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1201_cast_fp16 = slice_by_index(begin = var_1201_begin_0, end = var_1201_end_0, end_mask = var_1201_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1201_cast_fp16")]; tensor var_1205_begin_0 = const()[name = tensor("op_1205_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_1205_end_0 = const()[name = tensor("op_1205_end_0"), val = tensor([2, 256, 1, 576])]; tensor var_1205_end_mask_0 = const()[name = tensor("op_1205_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1205_cast_fp16 = slice_by_index(begin = var_1205_begin_0, end = var_1205_end_0, end_mask = var_1205_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1205_cast_fp16")]; tensor var_1209_begin_0 = const()[name = tensor("op_1209_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_1209_end_0 = const()[name = tensor("op_1209_end_0"), val = tensor([2, 320, 1, 576])]; tensor var_1209_end_mask_0 = const()[name = tensor("op_1209_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1209_cast_fp16 = slice_by_index(begin = var_1209_begin_0, end = var_1209_end_0, end_mask = var_1209_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1209_cast_fp16")]; tensor var_1213_begin_0 = const()[name = tensor("op_1213_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_1213_end_0 = const()[name = tensor("op_1213_end_0"), val = tensor([2, 384, 1, 576])]; tensor var_1213_end_mask_0 = const()[name = tensor("op_1213_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1213_cast_fp16 = slice_by_index(begin = var_1213_begin_0, end = var_1213_end_0, end_mask = var_1213_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1213_cast_fp16")]; tensor var_1217_begin_0 = const()[name = tensor("op_1217_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_1217_end_0 = const()[name = tensor("op_1217_end_0"), val = tensor([2, 448, 1, 576])]; tensor var_1217_end_mask_0 = const()[name = tensor("op_1217_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1217_cast_fp16 = slice_by_index(begin = var_1217_begin_0, end = var_1217_end_0, end_mask = var_1217_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1217_cast_fp16")]; tensor var_1221_begin_0 = const()[name = tensor("op_1221_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_1221_end_0 = const()[name = tensor("op_1221_end_0"), val = tensor([2, 512, 1, 576])]; tensor var_1221_end_mask_0 = const()[name = tensor("op_1221_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1221_cast_fp16 = slice_by_index(begin = var_1221_begin_0, end = var_1221_end_0, end_mask = var_1221_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1221_cast_fp16")]; tensor var_1225_begin_0 = const()[name = tensor("op_1225_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_1225_end_0 = const()[name = tensor("op_1225_end_0"), val = tensor([2, 576, 1, 576])]; tensor var_1225_end_mask_0 = const()[name = tensor("op_1225_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1225_cast_fp16 = slice_by_index(begin = var_1225_begin_0, end = var_1225_end_0, end_mask = var_1225_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1225_cast_fp16")]; tensor var_1229_begin_0 = const()[name = tensor("op_1229_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_1229_end_0 = const()[name = tensor("op_1229_end_0"), val = tensor([2, 640, 1, 576])]; tensor var_1229_end_mask_0 = const()[name = tensor("op_1229_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1229_cast_fp16 = slice_by_index(begin = var_1229_begin_0, end = var_1229_end_0, end_mask = var_1229_end_mask_0, x = v_9_cast_fp16)[name = tensor("op_1229_cast_fp16")]; tensor var_1233_equation_0 = const()[name = tensor("op_1233_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1233_cast_fp16 = einsum(equation = var_1233_equation_0, values = (var_1155_cast_fp16, var_1112_cast_fp16))[name = tensor("op_1233_cast_fp16")]; tensor var_1234_to_fp16 = const()[name = tensor("op_1234_to_fp16"), val = tensor(0x1p-3)]; tensor aw_41_cast_fp16 = mul(x = var_1233_cast_fp16, y = var_1234_to_fp16)[name = tensor("aw_41_cast_fp16")]; tensor var_1237_equation_0 = const()[name = tensor("op_1237_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1237_cast_fp16 = einsum(equation = var_1237_equation_0, values = (var_1159_cast_fp16, var_1116_cast_fp16))[name = tensor("op_1237_cast_fp16")]; tensor var_1238_to_fp16 = const()[name = tensor("op_1238_to_fp16"), val = tensor(0x1p-3)]; tensor aw_43_cast_fp16 = mul(x = var_1237_cast_fp16, y = var_1238_to_fp16)[name = tensor("aw_43_cast_fp16")]; tensor var_1241_equation_0 = const()[name = tensor("op_1241_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1241_cast_fp16 = einsum(equation = var_1241_equation_0, values = (var_1163_cast_fp16, var_1120_cast_fp16))[name = tensor("op_1241_cast_fp16")]; tensor var_1242_to_fp16 = const()[name = tensor("op_1242_to_fp16"), val = tensor(0x1p-3)]; tensor aw_45_cast_fp16 = mul(x = var_1241_cast_fp16, y = var_1242_to_fp16)[name = tensor("aw_45_cast_fp16")]; tensor var_1245_equation_0 = const()[name = tensor("op_1245_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1245_cast_fp16 = einsum(equation = var_1245_equation_0, values = (var_1167_cast_fp16, var_1124_cast_fp16))[name = tensor("op_1245_cast_fp16")]; tensor var_1246_to_fp16 = const()[name = tensor("op_1246_to_fp16"), val = tensor(0x1p-3)]; tensor aw_47_cast_fp16 = mul(x = var_1245_cast_fp16, y = var_1246_to_fp16)[name = tensor("aw_47_cast_fp16")]; tensor var_1249_equation_0 = const()[name = tensor("op_1249_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1249_cast_fp16 = einsum(equation = var_1249_equation_0, values = (var_1171_cast_fp16, var_1128_cast_fp16))[name = tensor("op_1249_cast_fp16")]; tensor var_1250_to_fp16 = const()[name = tensor("op_1250_to_fp16"), val = tensor(0x1p-3)]; tensor aw_49_cast_fp16 = mul(x = var_1249_cast_fp16, y = var_1250_to_fp16)[name = tensor("aw_49_cast_fp16")]; tensor var_1253_equation_0 = const()[name = tensor("op_1253_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1253_cast_fp16 = einsum(equation = var_1253_equation_0, values = (var_1175_cast_fp16, var_1132_cast_fp16))[name = tensor("op_1253_cast_fp16")]; tensor var_1254_to_fp16 = const()[name = tensor("op_1254_to_fp16"), val = tensor(0x1p-3)]; tensor aw_51_cast_fp16 = mul(x = var_1253_cast_fp16, y = var_1254_to_fp16)[name = tensor("aw_51_cast_fp16")]; tensor var_1257_equation_0 = const()[name = tensor("op_1257_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1257_cast_fp16 = einsum(equation = var_1257_equation_0, values = (var_1179_cast_fp16, var_1136_cast_fp16))[name = tensor("op_1257_cast_fp16")]; tensor var_1258_to_fp16 = const()[name = tensor("op_1258_to_fp16"), val = tensor(0x1p-3)]; tensor aw_53_cast_fp16 = mul(x = var_1257_cast_fp16, y = var_1258_to_fp16)[name = tensor("aw_53_cast_fp16")]; tensor var_1261_equation_0 = const()[name = tensor("op_1261_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1261_cast_fp16 = einsum(equation = var_1261_equation_0, values = (var_1183_cast_fp16, var_1140_cast_fp16))[name = tensor("op_1261_cast_fp16")]; tensor var_1262_to_fp16 = const()[name = tensor("op_1262_to_fp16"), val = tensor(0x1p-3)]; tensor aw_55_cast_fp16 = mul(x = var_1261_cast_fp16, y = var_1262_to_fp16)[name = tensor("aw_55_cast_fp16")]; tensor var_1265_equation_0 = const()[name = tensor("op_1265_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1265_cast_fp16 = einsum(equation = var_1265_equation_0, values = (var_1187_cast_fp16, var_1144_cast_fp16))[name = tensor("op_1265_cast_fp16")]; tensor var_1266_to_fp16 = const()[name = tensor("op_1266_to_fp16"), val = tensor(0x1p-3)]; tensor aw_57_cast_fp16 = mul(x = var_1265_cast_fp16, y = var_1266_to_fp16)[name = tensor("aw_57_cast_fp16")]; tensor var_1269_equation_0 = const()[name = tensor("op_1269_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1269_cast_fp16 = einsum(equation = var_1269_equation_0, values = (var_1191_cast_fp16, var_1148_cast_fp16))[name = tensor("op_1269_cast_fp16")]; tensor var_1270_to_fp16 = const()[name = tensor("op_1270_to_fp16"), val = tensor(0x1p-3)]; tensor aw_59_cast_fp16 = mul(x = var_1269_cast_fp16, y = var_1270_to_fp16)[name = tensor("aw_59_cast_fp16")]; tensor var_1272_cast_fp16 = softmax(axis = var_984, x = aw_41_cast_fp16)[name = tensor("op_1272_cast_fp16")]; tensor var_1273_cast_fp16 = softmax(axis = var_984, x = aw_43_cast_fp16)[name = tensor("op_1273_cast_fp16")]; tensor var_1274_cast_fp16 = softmax(axis = var_984, x = aw_45_cast_fp16)[name = tensor("op_1274_cast_fp16")]; tensor var_1275_cast_fp16 = softmax(axis = var_984, x = aw_47_cast_fp16)[name = tensor("op_1275_cast_fp16")]; tensor var_1276_cast_fp16 = softmax(axis = var_984, x = aw_49_cast_fp16)[name = tensor("op_1276_cast_fp16")]; tensor var_1277_cast_fp16 = softmax(axis = var_984, x = aw_51_cast_fp16)[name = tensor("op_1277_cast_fp16")]; tensor var_1278_cast_fp16 = softmax(axis = var_984, x = aw_53_cast_fp16)[name = tensor("op_1278_cast_fp16")]; tensor var_1279_cast_fp16 = softmax(axis = var_984, x = aw_55_cast_fp16)[name = tensor("op_1279_cast_fp16")]; tensor var_1280_cast_fp16 = softmax(axis = var_984, x = aw_57_cast_fp16)[name = tensor("op_1280_cast_fp16")]; tensor var_1281_cast_fp16 = softmax(axis = var_984, x = aw_59_cast_fp16)[name = tensor("op_1281_cast_fp16")]; tensor var_1283_equation_0 = const()[name = tensor("op_1283_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1283_cast_fp16 = einsum(equation = var_1283_equation_0, values = (var_1193_cast_fp16, var_1272_cast_fp16))[name = tensor("op_1283_cast_fp16")]; tensor var_1285_equation_0 = const()[name = tensor("op_1285_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1285_cast_fp16 = einsum(equation = var_1285_equation_0, values = (var_1197_cast_fp16, var_1273_cast_fp16))[name = tensor("op_1285_cast_fp16")]; tensor var_1287_equation_0 = const()[name = tensor("op_1287_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1287_cast_fp16 = einsum(equation = var_1287_equation_0, values = (var_1201_cast_fp16, var_1274_cast_fp16))[name = tensor("op_1287_cast_fp16")]; tensor var_1289_equation_0 = const()[name = tensor("op_1289_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1289_cast_fp16 = einsum(equation = var_1289_equation_0, values = (var_1205_cast_fp16, var_1275_cast_fp16))[name = tensor("op_1289_cast_fp16")]; tensor var_1291_equation_0 = const()[name = tensor("op_1291_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1291_cast_fp16 = einsum(equation = var_1291_equation_0, values = (var_1209_cast_fp16, var_1276_cast_fp16))[name = tensor("op_1291_cast_fp16")]; tensor var_1293_equation_0 = const()[name = tensor("op_1293_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1293_cast_fp16 = einsum(equation = var_1293_equation_0, values = (var_1213_cast_fp16, var_1277_cast_fp16))[name = tensor("op_1293_cast_fp16")]; tensor var_1295_equation_0 = const()[name = tensor("op_1295_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1295_cast_fp16 = einsum(equation = var_1295_equation_0, values = (var_1217_cast_fp16, var_1278_cast_fp16))[name = tensor("op_1295_cast_fp16")]; tensor var_1297_equation_0 = const()[name = tensor("op_1297_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1297_cast_fp16 = einsum(equation = var_1297_equation_0, values = (var_1221_cast_fp16, var_1279_cast_fp16))[name = tensor("op_1297_cast_fp16")]; tensor var_1299_equation_0 = const()[name = tensor("op_1299_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1299_cast_fp16 = einsum(equation = var_1299_equation_0, values = (var_1225_cast_fp16, var_1280_cast_fp16))[name = tensor("op_1299_cast_fp16")]; tensor var_1301_equation_0 = const()[name = tensor("op_1301_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1301_cast_fp16 = einsum(equation = var_1301_equation_0, values = (var_1229_cast_fp16, var_1281_cast_fp16))[name = tensor("op_1301_cast_fp16")]; tensor input_79_interleave_0 = const()[name = tensor("input_79_interleave_0"), val = tensor(false)]; tensor input_79_cast_fp16 = concat(axis = var_984, interleave = input_79_interleave_0, values = (var_1283_cast_fp16, var_1285_cast_fp16, var_1287_cast_fp16, var_1289_cast_fp16, var_1291_cast_fp16, var_1293_cast_fp16, var_1295_cast_fp16, var_1297_cast_fp16, var_1299_cast_fp16, var_1301_cast_fp16))[name = tensor("input_79_cast_fp16")]; tensor var_1307 = const()[name = tensor("op_1307"), val = tensor([1, 1])]; tensor var_1309 = const()[name = tensor("op_1309"), val = tensor([1, 1])]; tensor var_1311_pad_type_0 = const()[name = tensor("op_1311_pad_type_0"), val = tensor("custom")]; tensor var_1311_pad_0 = const()[name = tensor("op_1311_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(42239488)))]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43058752)))]; tensor var_1311_cast_fp16 = conv(bias = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_1309, groups = var_984, pad = var_1311_pad_0, pad_type = var_1311_pad_type_0, strides = var_1307, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_79_cast_fp16)[name = tensor("op_1311_cast_fp16")]; tensor inputs_15_cast_fp16 = add(x = var_1311_cast_fp16, y = inputs_13_cast_fp16)[name = tensor("inputs_15_cast_fp16")]; tensor var_1315 = const()[name = tensor("op_1315"), val = tensor([1])]; tensor channels_mean_15_cast_fp16 = reduce_mean(axes = var_1315, keep_dims = var_979, x = inputs_15_cast_fp16)[name = tensor("channels_mean_15_cast_fp16")]; tensor zero_mean_15_cast_fp16 = sub(x = inputs_15_cast_fp16, y = channels_mean_15_cast_fp16)[name = tensor("zero_mean_15_cast_fp16")]; tensor zero_mean_sq_15_cast_fp16 = mul(x = zero_mean_15_cast_fp16, y = zero_mean_15_cast_fp16)[name = tensor("zero_mean_sq_15_cast_fp16")]; tensor var_1319 = const()[name = tensor("op_1319"), val = tensor([1])]; tensor var_1320_cast_fp16 = reduce_mean(axes = var_1319, keep_dims = var_979, x = zero_mean_sq_15_cast_fp16)[name = tensor("op_1320_cast_fp16")]; tensor var_1321_to_fp16 = const()[name = tensor("op_1321_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1322_cast_fp16 = add(x = var_1320_cast_fp16, y = var_1321_to_fp16)[name = tensor("op_1322_cast_fp16")]; tensor denom_15_epsilon_0_to_fp16 = const()[name = tensor("denom_15_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_15_cast_fp16 = rsqrt(epsilon = denom_15_epsilon_0_to_fp16, x = var_1322_cast_fp16)[name = tensor("denom_15_cast_fp16")]; tensor out_15_cast_fp16 = mul(x = zero_mean_15_cast_fp16, y = denom_15_cast_fp16)[name = tensor("out_15_cast_fp16")]; tensor var_1326_to_fp16 = const()[name = tensor("op_1326_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43060096)))]; tensor var_1327_cast_fp16 = add(x = out_15_cast_fp16, y = var_1326_to_fp16)[name = tensor("op_1327_cast_fp16")]; tensor var_1329_to_fp16 = const()[name = tensor("op_1329_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43061440)))]; tensor hidden_states_47_cast_fp16 = mul(x = var_1327_cast_fp16, y = var_1329_to_fp16)[name = tensor("hidden_states_47_cast_fp16")]; tensor var_1336 = const()[name = tensor("op_1336"), val = tensor([1, 1])]; tensor var_1338 = const()[name = tensor("op_1338"), val = tensor([1, 1])]; tensor q_11_pad_type_0 = const()[name = tensor("q_11_pad_type_0"), val = tensor("custom")]; tensor q_11_pad_0 = const()[name = tensor("q_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43062784)))]; tensor q_11_cast_fp16 = conv(dilations = var_1338, groups = var_984, pad = q_11_pad_0, pad_type = q_11_pad_type_0, strides = var_1336, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_47_cast_fp16)[name = tensor("q_11_cast_fp16")]; tensor var_1342 = const()[name = tensor("op_1342"), val = tensor([1, 1])]; tensor var_1344 = const()[name = tensor("op_1344"), val = tensor([1, 1])]; tensor k_21_pad_type_0 = const()[name = tensor("k_21_pad_type_0"), val = tensor("custom")]; tensor k_21_pad_0 = const()[name = tensor("k_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43882048)))]; tensor k_21_cast_fp16 = conv(dilations = var_1344, groups = var_984, pad = k_21_pad_0, pad_type = k_21_pad_type_0, strides = var_1342, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_21_cast_fp16")]; tensor var_1348 = const()[name = tensor("op_1348"), val = tensor([1, 1])]; tensor var_1350 = const()[name = tensor("op_1350"), val = tensor([1, 1])]; tensor v_11_pad_type_0 = const()[name = tensor("v_11_pad_type_0"), val = tensor("custom")]; tensor v_11_pad_0 = const()[name = tensor("v_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(45192832)))]; tensor v_11_cast_fp16 = conv(dilations = var_1350, groups = var_984, pad = v_11_pad_0, pad_type = v_11_pad_type_0, strides = var_1348, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_11_cast_fp16")]; tensor var_1354_begin_0 = const()[name = tensor("op_1354_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1354_end_0 = const()[name = tensor("op_1354_end_0"), val = tensor([2, 64, 1, 576])]; tensor var_1354_end_mask_0 = const()[name = tensor("op_1354_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1354_cast_fp16 = slice_by_index(begin = var_1354_begin_0, end = var_1354_end_0, end_mask = var_1354_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1354_cast_fp16")]; tensor var_1358_begin_0 = const()[name = tensor("op_1358_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_1358_end_0 = const()[name = tensor("op_1358_end_0"), val = tensor([2, 128, 1, 576])]; tensor var_1358_end_mask_0 = const()[name = tensor("op_1358_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1358_cast_fp16 = slice_by_index(begin = var_1358_begin_0, end = var_1358_end_0, end_mask = var_1358_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1358_cast_fp16")]; tensor var_1362_begin_0 = const()[name = tensor("op_1362_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_1362_end_0 = const()[name = tensor("op_1362_end_0"), val = tensor([2, 192, 1, 576])]; tensor var_1362_end_mask_0 = const()[name = tensor("op_1362_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1362_cast_fp16 = slice_by_index(begin = var_1362_begin_0, end = var_1362_end_0, end_mask = var_1362_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1362_cast_fp16")]; tensor var_1366_begin_0 = const()[name = tensor("op_1366_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_1366_end_0 = const()[name = tensor("op_1366_end_0"), val = tensor([2, 256, 1, 576])]; tensor var_1366_end_mask_0 = const()[name = tensor("op_1366_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1366_cast_fp16 = slice_by_index(begin = var_1366_begin_0, end = var_1366_end_0, end_mask = var_1366_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1366_cast_fp16")]; tensor var_1370_begin_0 = const()[name = tensor("op_1370_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_1370_end_0 = const()[name = tensor("op_1370_end_0"), val = tensor([2, 320, 1, 576])]; tensor var_1370_end_mask_0 = const()[name = tensor("op_1370_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1370_cast_fp16 = slice_by_index(begin = var_1370_begin_0, end = var_1370_end_0, end_mask = var_1370_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1370_cast_fp16")]; tensor var_1374_begin_0 = const()[name = tensor("op_1374_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_1374_end_0 = const()[name = tensor("op_1374_end_0"), val = tensor([2, 384, 1, 576])]; tensor var_1374_end_mask_0 = const()[name = tensor("op_1374_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1374_cast_fp16 = slice_by_index(begin = var_1374_begin_0, end = var_1374_end_0, end_mask = var_1374_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1374_cast_fp16")]; tensor var_1378_begin_0 = const()[name = tensor("op_1378_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_1378_end_0 = const()[name = tensor("op_1378_end_0"), val = tensor([2, 448, 1, 576])]; tensor var_1378_end_mask_0 = const()[name = tensor("op_1378_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1378_cast_fp16 = slice_by_index(begin = var_1378_begin_0, end = var_1378_end_0, end_mask = var_1378_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1378_cast_fp16")]; tensor var_1382_begin_0 = const()[name = tensor("op_1382_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_1382_end_0 = const()[name = tensor("op_1382_end_0"), val = tensor([2, 512, 1, 576])]; tensor var_1382_end_mask_0 = const()[name = tensor("op_1382_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1382_cast_fp16 = slice_by_index(begin = var_1382_begin_0, end = var_1382_end_0, end_mask = var_1382_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1382_cast_fp16")]; tensor var_1386_begin_0 = const()[name = tensor("op_1386_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_1386_end_0 = const()[name = tensor("op_1386_end_0"), val = tensor([2, 576, 1, 576])]; tensor var_1386_end_mask_0 = const()[name = tensor("op_1386_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1386_cast_fp16 = slice_by_index(begin = var_1386_begin_0, end = var_1386_end_0, end_mask = var_1386_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1386_cast_fp16")]; tensor var_1390_begin_0 = const()[name = tensor("op_1390_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_1390_end_0 = const()[name = tensor("op_1390_end_0"), val = tensor([2, 640, 1, 576])]; tensor var_1390_end_mask_0 = const()[name = tensor("op_1390_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1390_cast_fp16 = slice_by_index(begin = var_1390_begin_0, end = var_1390_end_0, end_mask = var_1390_end_mask_0, x = q_11_cast_fp16)[name = tensor("op_1390_cast_fp16")]; tensor k_23_perm_0 = const()[name = tensor("k_23_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_1397_begin_0 = const()[name = tensor("op_1397_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1397_end_0 = const()[name = tensor("op_1397_end_0"), val = tensor([2, 77, 1, 64])]; tensor var_1397_end_mask_0 = const()[name = tensor("op_1397_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_8 = transpose(perm = k_23_perm_0, x = k_21_cast_fp16)[name = tensor("transpose_8")]; tensor var_1397_cast_fp16 = slice_by_index(begin = var_1397_begin_0, end = var_1397_end_0, end_mask = var_1397_end_mask_0, x = transpose_8)[name = tensor("op_1397_cast_fp16")]; tensor var_1401_begin_0 = const()[name = tensor("op_1401_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_1401_end_0 = const()[name = tensor("op_1401_end_0"), val = tensor([2, 77, 1, 128])]; tensor var_1401_end_mask_0 = const()[name = tensor("op_1401_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1401_cast_fp16 = slice_by_index(begin = var_1401_begin_0, end = var_1401_end_0, end_mask = var_1401_end_mask_0, x = transpose_8)[name = tensor("op_1401_cast_fp16")]; tensor var_1405_begin_0 = const()[name = tensor("op_1405_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_1405_end_0 = const()[name = tensor("op_1405_end_0"), val = tensor([2, 77, 1, 192])]; tensor var_1405_end_mask_0 = const()[name = tensor("op_1405_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1405_cast_fp16 = slice_by_index(begin = var_1405_begin_0, end = var_1405_end_0, end_mask = var_1405_end_mask_0, x = transpose_8)[name = tensor("op_1405_cast_fp16")]; tensor var_1409_begin_0 = const()[name = tensor("op_1409_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_1409_end_0 = const()[name = tensor("op_1409_end_0"), val = tensor([2, 77, 1, 256])]; tensor var_1409_end_mask_0 = const()[name = tensor("op_1409_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1409_cast_fp16 = slice_by_index(begin = var_1409_begin_0, end = var_1409_end_0, end_mask = var_1409_end_mask_0, x = transpose_8)[name = tensor("op_1409_cast_fp16")]; tensor var_1413_begin_0 = const()[name = tensor("op_1413_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_1413_end_0 = const()[name = tensor("op_1413_end_0"), val = tensor([2, 77, 1, 320])]; tensor var_1413_end_mask_0 = const()[name = tensor("op_1413_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1413_cast_fp16 = slice_by_index(begin = var_1413_begin_0, end = var_1413_end_0, end_mask = var_1413_end_mask_0, x = transpose_8)[name = tensor("op_1413_cast_fp16")]; tensor var_1417_begin_0 = const()[name = tensor("op_1417_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_1417_end_0 = const()[name = tensor("op_1417_end_0"), val = tensor([2, 77, 1, 384])]; tensor var_1417_end_mask_0 = const()[name = tensor("op_1417_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1417_cast_fp16 = slice_by_index(begin = var_1417_begin_0, end = var_1417_end_0, end_mask = var_1417_end_mask_0, x = transpose_8)[name = tensor("op_1417_cast_fp16")]; tensor var_1421_begin_0 = const()[name = tensor("op_1421_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_1421_end_0 = const()[name = tensor("op_1421_end_0"), val = tensor([2, 77, 1, 448])]; tensor var_1421_end_mask_0 = const()[name = tensor("op_1421_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1421_cast_fp16 = slice_by_index(begin = var_1421_begin_0, end = var_1421_end_0, end_mask = var_1421_end_mask_0, x = transpose_8)[name = tensor("op_1421_cast_fp16")]; tensor var_1425_begin_0 = const()[name = tensor("op_1425_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_1425_end_0 = const()[name = tensor("op_1425_end_0"), val = tensor([2, 77, 1, 512])]; tensor var_1425_end_mask_0 = const()[name = tensor("op_1425_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1425_cast_fp16 = slice_by_index(begin = var_1425_begin_0, end = var_1425_end_0, end_mask = var_1425_end_mask_0, x = transpose_8)[name = tensor("op_1425_cast_fp16")]; tensor var_1429_begin_0 = const()[name = tensor("op_1429_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_1429_end_0 = const()[name = tensor("op_1429_end_0"), val = tensor([2, 77, 1, 576])]; tensor var_1429_end_mask_0 = const()[name = tensor("op_1429_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1429_cast_fp16 = slice_by_index(begin = var_1429_begin_0, end = var_1429_end_0, end_mask = var_1429_end_mask_0, x = transpose_8)[name = tensor("op_1429_cast_fp16")]; tensor var_1433_begin_0 = const()[name = tensor("op_1433_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_1433_end_0 = const()[name = tensor("op_1433_end_0"), val = tensor([2, 77, 1, 640])]; tensor var_1433_end_mask_0 = const()[name = tensor("op_1433_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1433_cast_fp16 = slice_by_index(begin = var_1433_begin_0, end = var_1433_end_0, end_mask = var_1433_end_mask_0, x = transpose_8)[name = tensor("op_1433_cast_fp16")]; tensor var_1435_begin_0 = const()[name = tensor("op_1435_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1435_end_0 = const()[name = tensor("op_1435_end_0"), val = tensor([2, 64, 1, 77])]; tensor var_1435_end_mask_0 = const()[name = tensor("op_1435_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1435_cast_fp16 = slice_by_index(begin = var_1435_begin_0, end = var_1435_end_0, end_mask = var_1435_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1435_cast_fp16")]; tensor var_1439_begin_0 = const()[name = tensor("op_1439_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_1439_end_0 = const()[name = tensor("op_1439_end_0"), val = tensor([2, 128, 1, 77])]; tensor var_1439_end_mask_0 = const()[name = tensor("op_1439_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1439_cast_fp16 = slice_by_index(begin = var_1439_begin_0, end = var_1439_end_0, end_mask = var_1439_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1439_cast_fp16")]; tensor var_1443_begin_0 = const()[name = tensor("op_1443_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_1443_end_0 = const()[name = tensor("op_1443_end_0"), val = tensor([2, 192, 1, 77])]; tensor var_1443_end_mask_0 = const()[name = tensor("op_1443_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1443_cast_fp16 = slice_by_index(begin = var_1443_begin_0, end = var_1443_end_0, end_mask = var_1443_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1443_cast_fp16")]; tensor var_1447_begin_0 = const()[name = tensor("op_1447_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_1447_end_0 = const()[name = tensor("op_1447_end_0"), val = tensor([2, 256, 1, 77])]; tensor var_1447_end_mask_0 = const()[name = tensor("op_1447_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1447_cast_fp16 = slice_by_index(begin = var_1447_begin_0, end = var_1447_end_0, end_mask = var_1447_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1447_cast_fp16")]; tensor var_1451_begin_0 = const()[name = tensor("op_1451_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_1451_end_0 = const()[name = tensor("op_1451_end_0"), val = tensor([2, 320, 1, 77])]; tensor var_1451_end_mask_0 = const()[name = tensor("op_1451_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1451_cast_fp16 = slice_by_index(begin = var_1451_begin_0, end = var_1451_end_0, end_mask = var_1451_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1451_cast_fp16")]; tensor var_1455_begin_0 = const()[name = tensor("op_1455_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_1455_end_0 = const()[name = tensor("op_1455_end_0"), val = tensor([2, 384, 1, 77])]; tensor var_1455_end_mask_0 = const()[name = tensor("op_1455_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1455_cast_fp16 = slice_by_index(begin = var_1455_begin_0, end = var_1455_end_0, end_mask = var_1455_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1455_cast_fp16")]; tensor var_1459_begin_0 = const()[name = tensor("op_1459_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_1459_end_0 = const()[name = tensor("op_1459_end_0"), val = tensor([2, 448, 1, 77])]; tensor var_1459_end_mask_0 = const()[name = tensor("op_1459_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1459_cast_fp16 = slice_by_index(begin = var_1459_begin_0, end = var_1459_end_0, end_mask = var_1459_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1459_cast_fp16")]; tensor var_1463_begin_0 = const()[name = tensor("op_1463_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_1463_end_0 = const()[name = tensor("op_1463_end_0"), val = tensor([2, 512, 1, 77])]; tensor var_1463_end_mask_0 = const()[name = tensor("op_1463_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1463_cast_fp16 = slice_by_index(begin = var_1463_begin_0, end = var_1463_end_0, end_mask = var_1463_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1463_cast_fp16")]; tensor var_1467_begin_0 = const()[name = tensor("op_1467_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_1467_end_0 = const()[name = tensor("op_1467_end_0"), val = tensor([2, 576, 1, 77])]; tensor var_1467_end_mask_0 = const()[name = tensor("op_1467_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1467_cast_fp16 = slice_by_index(begin = var_1467_begin_0, end = var_1467_end_0, end_mask = var_1467_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1467_cast_fp16")]; tensor var_1471_begin_0 = const()[name = tensor("op_1471_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_1471_end_0 = const()[name = tensor("op_1471_end_0"), val = tensor([2, 640, 1, 77])]; tensor var_1471_end_mask_0 = const()[name = tensor("op_1471_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1471_cast_fp16 = slice_by_index(begin = var_1471_begin_0, end = var_1471_end_0, end_mask = var_1471_end_mask_0, x = v_11_cast_fp16)[name = tensor("op_1471_cast_fp16")]; tensor var_1475_equation_0 = const()[name = tensor("op_1475_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1475_cast_fp16 = einsum(equation = var_1475_equation_0, values = (var_1397_cast_fp16, var_1354_cast_fp16))[name = tensor("op_1475_cast_fp16")]; tensor var_1476_to_fp16 = const()[name = tensor("op_1476_to_fp16"), val = tensor(0x1p-3)]; tensor aw_61_cast_fp16 = mul(x = var_1475_cast_fp16, y = var_1476_to_fp16)[name = tensor("aw_61_cast_fp16")]; tensor var_1479_equation_0 = const()[name = tensor("op_1479_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1479_cast_fp16 = einsum(equation = var_1479_equation_0, values = (var_1401_cast_fp16, var_1358_cast_fp16))[name = tensor("op_1479_cast_fp16")]; tensor var_1480_to_fp16 = const()[name = tensor("op_1480_to_fp16"), val = tensor(0x1p-3)]; tensor aw_63_cast_fp16 = mul(x = var_1479_cast_fp16, y = var_1480_to_fp16)[name = tensor("aw_63_cast_fp16")]; tensor var_1483_equation_0 = const()[name = tensor("op_1483_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1483_cast_fp16 = einsum(equation = var_1483_equation_0, values = (var_1405_cast_fp16, var_1362_cast_fp16))[name = tensor("op_1483_cast_fp16")]; tensor var_1484_to_fp16 = const()[name = tensor("op_1484_to_fp16"), val = tensor(0x1p-3)]; tensor aw_65_cast_fp16 = mul(x = var_1483_cast_fp16, y = var_1484_to_fp16)[name = tensor("aw_65_cast_fp16")]; tensor var_1487_equation_0 = const()[name = tensor("op_1487_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1487_cast_fp16 = einsum(equation = var_1487_equation_0, values = (var_1409_cast_fp16, var_1366_cast_fp16))[name = tensor("op_1487_cast_fp16")]; tensor var_1488_to_fp16 = const()[name = tensor("op_1488_to_fp16"), val = tensor(0x1p-3)]; tensor aw_67_cast_fp16 = mul(x = var_1487_cast_fp16, y = var_1488_to_fp16)[name = tensor("aw_67_cast_fp16")]; tensor var_1491_equation_0 = const()[name = tensor("op_1491_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1491_cast_fp16 = einsum(equation = var_1491_equation_0, values = (var_1413_cast_fp16, var_1370_cast_fp16))[name = tensor("op_1491_cast_fp16")]; tensor var_1492_to_fp16 = const()[name = tensor("op_1492_to_fp16"), val = tensor(0x1p-3)]; tensor aw_69_cast_fp16 = mul(x = var_1491_cast_fp16, y = var_1492_to_fp16)[name = tensor("aw_69_cast_fp16")]; tensor var_1495_equation_0 = const()[name = tensor("op_1495_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1495_cast_fp16 = einsum(equation = var_1495_equation_0, values = (var_1417_cast_fp16, var_1374_cast_fp16))[name = tensor("op_1495_cast_fp16")]; tensor var_1496_to_fp16 = const()[name = tensor("op_1496_to_fp16"), val = tensor(0x1p-3)]; tensor aw_71_cast_fp16 = mul(x = var_1495_cast_fp16, y = var_1496_to_fp16)[name = tensor("aw_71_cast_fp16")]; tensor var_1499_equation_0 = const()[name = tensor("op_1499_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1499_cast_fp16 = einsum(equation = var_1499_equation_0, values = (var_1421_cast_fp16, var_1378_cast_fp16))[name = tensor("op_1499_cast_fp16")]; tensor var_1500_to_fp16 = const()[name = tensor("op_1500_to_fp16"), val = tensor(0x1p-3)]; tensor aw_73_cast_fp16 = mul(x = var_1499_cast_fp16, y = var_1500_to_fp16)[name = tensor("aw_73_cast_fp16")]; tensor var_1503_equation_0 = const()[name = tensor("op_1503_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1503_cast_fp16 = einsum(equation = var_1503_equation_0, values = (var_1425_cast_fp16, var_1382_cast_fp16))[name = tensor("op_1503_cast_fp16")]; tensor var_1504_to_fp16 = const()[name = tensor("op_1504_to_fp16"), val = tensor(0x1p-3)]; tensor aw_75_cast_fp16 = mul(x = var_1503_cast_fp16, y = var_1504_to_fp16)[name = tensor("aw_75_cast_fp16")]; tensor var_1507_equation_0 = const()[name = tensor("op_1507_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1507_cast_fp16 = einsum(equation = var_1507_equation_0, values = (var_1429_cast_fp16, var_1386_cast_fp16))[name = tensor("op_1507_cast_fp16")]; tensor var_1508_to_fp16 = const()[name = tensor("op_1508_to_fp16"), val = tensor(0x1p-3)]; tensor aw_77_cast_fp16 = mul(x = var_1507_cast_fp16, y = var_1508_to_fp16)[name = tensor("aw_77_cast_fp16")]; tensor var_1511_equation_0 = const()[name = tensor("op_1511_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1511_cast_fp16 = einsum(equation = var_1511_equation_0, values = (var_1433_cast_fp16, var_1390_cast_fp16))[name = tensor("op_1511_cast_fp16")]; tensor var_1512_to_fp16 = const()[name = tensor("op_1512_to_fp16"), val = tensor(0x1p-3)]; tensor aw_79_cast_fp16 = mul(x = var_1511_cast_fp16, y = var_1512_to_fp16)[name = tensor("aw_79_cast_fp16")]; tensor var_1514_cast_fp16 = softmax(axis = var_984, x = aw_61_cast_fp16)[name = tensor("op_1514_cast_fp16")]; tensor var_1515_cast_fp16 = softmax(axis = var_984, x = aw_63_cast_fp16)[name = tensor("op_1515_cast_fp16")]; tensor var_1516_cast_fp16 = softmax(axis = var_984, x = aw_65_cast_fp16)[name = tensor("op_1516_cast_fp16")]; tensor var_1517_cast_fp16 = softmax(axis = var_984, x = aw_67_cast_fp16)[name = tensor("op_1517_cast_fp16")]; tensor var_1518_cast_fp16 = softmax(axis = var_984, x = aw_69_cast_fp16)[name = tensor("op_1518_cast_fp16")]; tensor var_1519_cast_fp16 = softmax(axis = var_984, x = aw_71_cast_fp16)[name = tensor("op_1519_cast_fp16")]; tensor var_1520_cast_fp16 = softmax(axis = var_984, x = aw_73_cast_fp16)[name = tensor("op_1520_cast_fp16")]; tensor var_1521_cast_fp16 = softmax(axis = var_984, x = aw_75_cast_fp16)[name = tensor("op_1521_cast_fp16")]; tensor var_1522_cast_fp16 = softmax(axis = var_984, x = aw_77_cast_fp16)[name = tensor("op_1522_cast_fp16")]; tensor var_1523_cast_fp16 = softmax(axis = var_984, x = aw_79_cast_fp16)[name = tensor("op_1523_cast_fp16")]; tensor var_1525_equation_0 = const()[name = tensor("op_1525_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1525_cast_fp16 = einsum(equation = var_1525_equation_0, values = (var_1435_cast_fp16, var_1514_cast_fp16))[name = tensor("op_1525_cast_fp16")]; tensor var_1527_equation_0 = const()[name = tensor("op_1527_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1527_cast_fp16 = einsum(equation = var_1527_equation_0, values = (var_1439_cast_fp16, var_1515_cast_fp16))[name = tensor("op_1527_cast_fp16")]; tensor var_1529_equation_0 = const()[name = tensor("op_1529_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1529_cast_fp16 = einsum(equation = var_1529_equation_0, values = (var_1443_cast_fp16, var_1516_cast_fp16))[name = tensor("op_1529_cast_fp16")]; tensor var_1531_equation_0 = const()[name = tensor("op_1531_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1531_cast_fp16 = einsum(equation = var_1531_equation_0, values = (var_1447_cast_fp16, var_1517_cast_fp16))[name = tensor("op_1531_cast_fp16")]; tensor var_1533_equation_0 = const()[name = tensor("op_1533_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1533_cast_fp16 = einsum(equation = var_1533_equation_0, values = (var_1451_cast_fp16, var_1518_cast_fp16))[name = tensor("op_1533_cast_fp16")]; tensor var_1535_equation_0 = const()[name = tensor("op_1535_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1535_cast_fp16 = einsum(equation = var_1535_equation_0, values = (var_1455_cast_fp16, var_1519_cast_fp16))[name = tensor("op_1535_cast_fp16")]; tensor var_1537_equation_0 = const()[name = tensor("op_1537_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1537_cast_fp16 = einsum(equation = var_1537_equation_0, values = (var_1459_cast_fp16, var_1520_cast_fp16))[name = tensor("op_1537_cast_fp16")]; tensor var_1539_equation_0 = const()[name = tensor("op_1539_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1539_cast_fp16 = einsum(equation = var_1539_equation_0, values = (var_1463_cast_fp16, var_1521_cast_fp16))[name = tensor("op_1539_cast_fp16")]; tensor var_1541_equation_0 = const()[name = tensor("op_1541_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1541_cast_fp16 = einsum(equation = var_1541_equation_0, values = (var_1467_cast_fp16, var_1522_cast_fp16))[name = tensor("op_1541_cast_fp16")]; tensor var_1543_equation_0 = const()[name = tensor("op_1543_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1543_cast_fp16 = einsum(equation = var_1543_equation_0, values = (var_1471_cast_fp16, var_1523_cast_fp16))[name = tensor("op_1543_cast_fp16")]; tensor input_81_interleave_0 = const()[name = tensor("input_81_interleave_0"), val = tensor(false)]; tensor input_81_cast_fp16 = concat(axis = var_984, interleave = input_81_interleave_0, values = (var_1525_cast_fp16, var_1527_cast_fp16, var_1529_cast_fp16, var_1531_cast_fp16, var_1533_cast_fp16, var_1535_cast_fp16, var_1537_cast_fp16, var_1539_cast_fp16, var_1541_cast_fp16, var_1543_cast_fp16))[name = tensor("input_81_cast_fp16")]; tensor var_1549 = const()[name = tensor("op_1549"), val = tensor([1, 1])]; tensor var_1551 = const()[name = tensor("op_1551"), val = tensor([1, 1])]; tensor var_1553_pad_type_0 = const()[name = tensor("op_1553_pad_type_0"), val = tensor("custom")]; tensor var_1553_pad_0 = const()[name = tensor("op_1553_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(46503616)))]; tensor down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47322880)))]; tensor var_1553_cast_fp16 = conv(bias = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_1551, groups = var_984, pad = var_1553_pad_0, pad_type = var_1553_pad_type_0, strides = var_1549, weight = down_blocks_1_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_81_cast_fp16)[name = tensor("op_1553_cast_fp16")]; tensor inputs_17_cast_fp16 = add(x = var_1553_cast_fp16, y = inputs_15_cast_fp16)[name = tensor("inputs_17_cast_fp16")]; tensor var_1557 = const()[name = tensor("op_1557"), val = tensor([1])]; tensor channels_mean_17_cast_fp16 = reduce_mean(axes = var_1557, keep_dims = var_979, x = inputs_17_cast_fp16)[name = tensor("channels_mean_17_cast_fp16")]; tensor zero_mean_17_cast_fp16 = sub(x = inputs_17_cast_fp16, y = channels_mean_17_cast_fp16)[name = tensor("zero_mean_17_cast_fp16")]; tensor zero_mean_sq_17_cast_fp16 = mul(x = zero_mean_17_cast_fp16, y = zero_mean_17_cast_fp16)[name = tensor("zero_mean_sq_17_cast_fp16")]; tensor var_1561 = const()[name = tensor("op_1561"), val = tensor([1])]; tensor var_1562_cast_fp16 = reduce_mean(axes = var_1561, keep_dims = var_979, x = zero_mean_sq_17_cast_fp16)[name = tensor("op_1562_cast_fp16")]; tensor var_1563_to_fp16 = const()[name = tensor("op_1563_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1564_cast_fp16 = add(x = var_1562_cast_fp16, y = var_1563_to_fp16)[name = tensor("op_1564_cast_fp16")]; tensor denom_17_epsilon_0_to_fp16 = const()[name = tensor("denom_17_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_17_cast_fp16 = rsqrt(epsilon = denom_17_epsilon_0_to_fp16, x = var_1564_cast_fp16)[name = tensor("denom_17_cast_fp16")]; tensor out_17_cast_fp16 = mul(x = zero_mean_17_cast_fp16, y = denom_17_cast_fp16)[name = tensor("out_17_cast_fp16")]; tensor var_1568_to_fp16 = const()[name = tensor("op_1568_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47324224)))]; tensor var_1569_cast_fp16 = add(x = out_17_cast_fp16, y = var_1568_to_fp16)[name = tensor("op_1569_cast_fp16")]; tensor var_1571_to_fp16 = const()[name = tensor("op_1571_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47325568)))]; tensor input_83_cast_fp16 = mul(x = var_1569_cast_fp16, y = var_1571_to_fp16)[name = tensor("input_83_cast_fp16")]; tensor var_1579 = const()[name = tensor("op_1579"), val = tensor([1, 1])]; tensor var_1581 = const()[name = tensor("op_1581"), val = tensor([1, 1])]; tensor var_1583_pad_type_0 = const()[name = tensor("op_1583_pad_type_0"), val = tensor("custom")]; tensor var_1583_pad_0 = const()[name = tensor("op_1583_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(47326912)))]; tensor down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53880576)))]; tensor var_1583_cast_fp16 = conv(bias = down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_1581, groups = var_984, pad = var_1583_pad_0, pad_type = var_1583_pad_type_0, strides = var_1579, weight = down_blocks_1_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_83_cast_fp16)[name = tensor("op_1583_cast_fp16")]; tensor var_1584_split_sizes_0 = const()[name = tensor("op_1584_split_sizes_0"), val = tensor([2560, 2560])]; tensor var_1584_axis_0 = const()[name = tensor("op_1584_axis_0"), val = tensor(1)]; tensor var_1584_cast_fp16_0, tensor var_1584_cast_fp16_1 = split(axis = var_1584_axis_0, split_sizes = var_1584_split_sizes_0, x = var_1583_cast_fp16)[name = tensor("op_1584_cast_fp16")]; tensor var_1586_mode_0 = const()[name = tensor("op_1586_mode_0"), val = tensor("EXACT")]; tensor var_1586_cast_fp16 = gelu(mode = var_1586_mode_0, x = var_1584_cast_fp16_1)[name = tensor("op_1586_cast_fp16")]; tensor input_85_cast_fp16 = mul(x = var_1584_cast_fp16_0, y = var_1586_cast_fp16)[name = tensor("input_85_cast_fp16")]; tensor var_1590 = const()[name = tensor("op_1590"), val = tensor([1, 1])]; tensor var_1592 = const()[name = tensor("op_1592"), val = tensor([1, 1])]; tensor var_1594_pad_type_0 = const()[name = tensor("op_1594_pad_type_0"), val = tensor("custom")]; tensor var_1594_pad_0 = const()[name = tensor("op_1594_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(53890880)))]; tensor down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57167744)))]; tensor var_1594_cast_fp16 = conv(bias = down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_1592, groups = var_984, pad = var_1594_pad_0, pad_type = var_1594_pad_type_0, strides = var_1590, weight = down_blocks_1_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_85_cast_fp16)[name = tensor("op_1594_cast_fp16")]; tensor hidden_states_51_cast_fp16 = add(x = var_1594_cast_fp16, y = inputs_17_cast_fp16)[name = tensor("hidden_states_51_cast_fp16")]; tensor var_1596 = const()[name = tensor("op_1596"), val = tensor([2, 640, 24, 24])]; tensor input_87_cast_fp16 = reshape(shape = var_1596, x = hidden_states_51_cast_fp16)[name = tensor("input_87_cast_fp16")]; tensor var_1600 = const()[name = tensor("op_1600"), val = tensor([1, 1])]; tensor var_1602 = const()[name = tensor("op_1602"), val = tensor([1, 1])]; tensor hidden_states_53_pad_type_0 = const()[name = tensor("hidden_states_53_pad_type_0"), val = tensor("custom")]; tensor hidden_states_53_pad_0 = const()[name = tensor("hidden_states_53_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57169088)))]; tensor down_blocks_1_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57988352)))]; tensor hidden_states_53_cast_fp16 = conv(bias = down_blocks_1_attentions_0_proj_out_bias_to_fp16, dilations = var_1602, groups = var_984, pad = hidden_states_53_pad_0, pad_type = hidden_states_53_pad_type_0, strides = var_1600, weight = down_blocks_1_attentions_0_proj_out_weight_to_fp16, x = input_87_cast_fp16)[name = tensor("hidden_states_53_cast_fp16")]; tensor input_89_cast_fp16_1 = add(x = hidden_states_53_cast_fp16, y = hidden_states_41_cast_fp16)[name = tensor("input_89_cast_fp16")]; tensor reshape_36_shape_0 = const()[name = tensor("reshape_36_shape_0"), val = tensor([2, 32, 20, 24, 24])]; tensor reshape_36_cast_fp16 = reshape(shape = reshape_36_shape_0, x = input_89_cast_fp16_1)[name = tensor("reshape_36_cast_fp16")]; tensor reduce_mean_27_axes_0 = const()[name = tensor("reduce_mean_27_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_27_keep_dims_0 = const()[name = tensor("reduce_mean_27_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_27_cast_fp16 = reduce_mean(axes = reduce_mean_27_axes_0, keep_dims = reduce_mean_27_keep_dims_0, x = reshape_36_cast_fp16)[name = tensor("reduce_mean_27_cast_fp16")]; tensor sub_18_cast_fp16 = sub(x = reshape_36_cast_fp16, y = reduce_mean_27_cast_fp16)[name = tensor("sub_18_cast_fp16")]; tensor square_9_cast_fp16 = square(x = sub_18_cast_fp16)[name = tensor("square_9_cast_fp16")]; tensor reduce_mean_29_axes_0 = const()[name = tensor("reduce_mean_29_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_29_keep_dims_0 = const()[name = tensor("reduce_mean_29_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_29_cast_fp16 = reduce_mean(axes = reduce_mean_29_axes_0, keep_dims = reduce_mean_29_keep_dims_0, x = square_9_cast_fp16)[name = tensor("reduce_mean_29_cast_fp16")]; tensor add_18_y_0_to_fp16 = const()[name = tensor("add_18_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_18_cast_fp16 = add(x = reduce_mean_29_cast_fp16, y = add_18_y_0_to_fp16)[name = tensor("add_18_cast_fp16")]; tensor sqrt_9_cast_fp16 = sqrt(x = add_18_cast_fp16)[name = tensor("sqrt_9_cast_fp16")]; tensor real_div_9_cast_fp16 = real_div(x = sub_18_cast_fp16, y = sqrt_9_cast_fp16)[name = tensor("real_div_9_cast_fp16")]; tensor reshape_37_shape_0 = const()[name = tensor("reshape_37_shape_0"), val = tensor([2, 640, 24, 24])]; tensor reshape_37_cast_fp16 = reshape(shape = reshape_37_shape_0, x = real_div_9_cast_fp16)[name = tensor("reshape_37_cast_fp16")]; tensor add_19_gamma_0_to_fp16 = const()[name = tensor("add_19_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57989696)))]; tensor add_19_beta_0_to_fp16 = const()[name = tensor("add_19_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57991040)))]; tensor add_19_epsilon_0_to_fp16 = const()[name = tensor("add_19_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_19_cast_fp16 = batch_norm(beta = add_19_beta_0_to_fp16, epsilon = add_19_epsilon_0_to_fp16, gamma = add_19_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_37_cast_fp16)[name = tensor("add_19_cast_fp16")]; tensor input_93_cast_fp16 = silu(x = add_19_cast_fp16)[name = tensor("input_93_cast_fp16")]; tensor var_1617 = const()[name = tensor("op_1617"), val = tensor([1, 1])]; tensor var_1619 = const()[name = tensor("op_1619"), val = tensor([1, 1])]; tensor hidden_states_55_pad_type_0 = const()[name = tensor("hidden_states_55_pad_type_0"), val = tensor("custom")]; tensor hidden_states_55_pad_0 = const()[name = tensor("hidden_states_55_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_1_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(57992384)))]; tensor down_blocks_1_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65365248)))]; tensor hidden_states_55_cast_fp16 = conv(bias = down_blocks_1_resnets_1_conv1_bias_to_fp16, dilations = var_1619, groups = var_984, pad = hidden_states_55_pad_0, pad_type = hidden_states_55_pad_type_0, strides = var_1617, weight = down_blocks_1_resnets_1_conv1_weight_to_fp16, x = input_93_cast_fp16)[name = tensor("hidden_states_55_cast_fp16")]; tensor var_1625 = const()[name = tensor("op_1625"), val = tensor([1, 1])]; tensor var_1627 = const()[name = tensor("op_1627"), val = tensor([1, 1])]; tensor temb_7_pad_type_0 = const()[name = tensor("temb_7_pad_type_0"), val = tensor("custom")]; tensor temb_7_pad_0 = const()[name = tensor("temb_7_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(65366592)))]; tensor down_blocks_1_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67005056)))]; tensor temb_7_cast_fp16 = conv(bias = down_blocks_1_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_1627, groups = var_984, pad = temb_7_pad_0, pad_type = temb_7_pad_type_0, strides = var_1625, weight = down_blocks_1_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_7_cast_fp16")]; tensor input_97_cast_fp16 = add(x = hidden_states_55_cast_fp16, y = temb_7_cast_fp16)[name = tensor("input_97_cast_fp16")]; tensor reshape_40_shape_0 = const()[name = tensor("reshape_40_shape_0"), val = tensor([2, 32, 20, 24, 24])]; tensor reshape_40_cast_fp16 = reshape(shape = reshape_40_shape_0, x = input_97_cast_fp16)[name = tensor("reshape_40_cast_fp16")]; tensor reduce_mean_30_axes_0 = const()[name = tensor("reduce_mean_30_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_30_keep_dims_0 = const()[name = tensor("reduce_mean_30_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_30_cast_fp16 = reduce_mean(axes = reduce_mean_30_axes_0, keep_dims = reduce_mean_30_keep_dims_0, x = reshape_40_cast_fp16)[name = tensor("reduce_mean_30_cast_fp16")]; tensor sub_20_cast_fp16 = sub(x = reshape_40_cast_fp16, y = reduce_mean_30_cast_fp16)[name = tensor("sub_20_cast_fp16")]; tensor square_10_cast_fp16 = square(x = sub_20_cast_fp16)[name = tensor("square_10_cast_fp16")]; tensor reduce_mean_32_axes_0 = const()[name = tensor("reduce_mean_32_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_32_keep_dims_0 = const()[name = tensor("reduce_mean_32_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_32_cast_fp16 = reduce_mean(axes = reduce_mean_32_axes_0, keep_dims = reduce_mean_32_keep_dims_0, x = square_10_cast_fp16)[name = tensor("reduce_mean_32_cast_fp16")]; tensor add_20_y_0_to_fp16 = const()[name = tensor("add_20_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_20_cast_fp16 = add(x = reduce_mean_32_cast_fp16, y = add_20_y_0_to_fp16)[name = tensor("add_20_cast_fp16")]; tensor sqrt_10_cast_fp16 = sqrt(x = add_20_cast_fp16)[name = tensor("sqrt_10_cast_fp16")]; tensor real_div_10_cast_fp16 = real_div(x = sub_20_cast_fp16, y = sqrt_10_cast_fp16)[name = tensor("real_div_10_cast_fp16")]; tensor reshape_41_shape_0 = const()[name = tensor("reshape_41_shape_0"), val = tensor([2, 640, 24, 24])]; tensor reshape_41_cast_fp16 = reshape(shape = reshape_41_shape_0, x = real_div_10_cast_fp16)[name = tensor("reshape_41_cast_fp16")]; tensor add_21_gamma_0_to_fp16 = const()[name = tensor("add_21_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67006400)))]; tensor add_21_beta_0_to_fp16 = const()[name = tensor("add_21_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67007744)))]; tensor add_21_epsilon_0_to_fp16 = const()[name = tensor("add_21_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_21_cast_fp16 = batch_norm(beta = add_21_beta_0_to_fp16, epsilon = add_21_epsilon_0_to_fp16, gamma = add_21_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_41_cast_fp16)[name = tensor("add_21_cast_fp16")]; tensor input_101_cast_fp16 = silu(x = add_21_cast_fp16)[name = tensor("input_101_cast_fp16")]; tensor var_1637 = const()[name = tensor("op_1637"), val = tensor([1, 1])]; tensor var_1639 = const()[name = tensor("op_1639"), val = tensor([1, 1])]; tensor hidden_states_57_pad_type_0 = const()[name = tensor("hidden_states_57_pad_type_0"), val = tensor("custom")]; tensor hidden_states_57_pad_0 = const()[name = tensor("hidden_states_57_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_1_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67009088)))]; tensor down_blocks_1_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_1_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74381952)))]; tensor hidden_states_57_cast_fp16 = conv(bias = down_blocks_1_resnets_1_conv2_bias_to_fp16, dilations = var_1639, groups = var_984, pad = hidden_states_57_pad_0, pad_type = hidden_states_57_pad_type_0, strides = var_1637, weight = down_blocks_1_resnets_1_conv2_weight_to_fp16, x = input_101_cast_fp16)[name = tensor("hidden_states_57_cast_fp16")]; tensor hidden_states_59_cast_fp16 = add(x = input_89_cast_fp16_1, y = hidden_states_57_cast_fp16)[name = tensor("hidden_states_59_cast_fp16")]; tensor reshape_44_shape_0 = const()[name = tensor("reshape_44_shape_0"), val = tensor([2, 32, 20, 24, 24])]; tensor reshape_44_cast_fp16 = reshape(shape = reshape_44_shape_0, x = hidden_states_59_cast_fp16)[name = tensor("reshape_44_cast_fp16")]; tensor reduce_mean_33_axes_0 = const()[name = tensor("reduce_mean_33_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_33_keep_dims_0 = const()[name = tensor("reduce_mean_33_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_33_cast_fp16 = reduce_mean(axes = reduce_mean_33_axes_0, keep_dims = reduce_mean_33_keep_dims_0, x = reshape_44_cast_fp16)[name = tensor("reduce_mean_33_cast_fp16")]; tensor sub_22_cast_fp16 = sub(x = reshape_44_cast_fp16, y = reduce_mean_33_cast_fp16)[name = tensor("sub_22_cast_fp16")]; tensor square_11_cast_fp16 = square(x = sub_22_cast_fp16)[name = tensor("square_11_cast_fp16")]; tensor reduce_mean_35_axes_0 = const()[name = tensor("reduce_mean_35_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_35_keep_dims_0 = const()[name = tensor("reduce_mean_35_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_35_cast_fp16 = reduce_mean(axes = reduce_mean_35_axes_0, keep_dims = reduce_mean_35_keep_dims_0, x = square_11_cast_fp16)[name = tensor("reduce_mean_35_cast_fp16")]; tensor add_22_y_0_to_fp16 = const()[name = tensor("add_22_y_0_to_fp16"), val = tensor(0x1.1p-20)]; tensor add_22_cast_fp16 = add(x = reduce_mean_35_cast_fp16, y = add_22_y_0_to_fp16)[name = tensor("add_22_cast_fp16")]; tensor sqrt_11_cast_fp16 = sqrt(x = add_22_cast_fp16)[name = tensor("sqrt_11_cast_fp16")]; tensor real_div_11_cast_fp16 = real_div(x = sub_22_cast_fp16, y = sqrt_11_cast_fp16)[name = tensor("real_div_11_cast_fp16")]; tensor reshape_45_shape_0 = const()[name = tensor("reshape_45_shape_0"), val = tensor([2, 640, 24, 24])]; tensor reshape_45_cast_fp16 = reshape(shape = reshape_45_shape_0, x = real_div_11_cast_fp16)[name = tensor("reshape_45_cast_fp16")]; tensor add_23_gamma_0_to_fp16 = const()[name = tensor("add_23_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74383296)))]; tensor add_23_beta_0_to_fp16 = const()[name = tensor("add_23_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74384640)))]; tensor add_23_epsilon_0_to_fp16 = const()[name = tensor("add_23_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_23_cast_fp16 = batch_norm(beta = add_23_beta_0_to_fp16, epsilon = add_23_epsilon_0_to_fp16, gamma = add_23_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_45_cast_fp16)[name = tensor("add_23_cast_fp16")]; tensor var_1659 = const()[name = tensor("op_1659"), val = tensor([1, 1])]; tensor var_1661 = const()[name = tensor("op_1661"), val = tensor([1, 1])]; tensor hidden_states_61_pad_type_0 = const()[name = tensor("hidden_states_61_pad_type_0"), val = tensor("custom")]; tensor hidden_states_61_pad_0 = const()[name = tensor("hidden_states_61_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(74385984)))]; tensor down_blocks_1_attentions_1_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75205248)))]; tensor hidden_states_61_cast_fp16 = conv(bias = down_blocks_1_attentions_1_proj_in_bias_to_fp16, dilations = var_1661, groups = var_984, pad = hidden_states_61_pad_0, pad_type = hidden_states_61_pad_type_0, strides = var_1659, weight = down_blocks_1_attentions_1_proj_in_weight_to_fp16, x = add_23_cast_fp16)[name = tensor("hidden_states_61_cast_fp16")]; tensor var_1666 = const()[name = tensor("op_1666"), val = tensor([2, 640, 1, 576])]; tensor inputs_19_cast_fp16 = reshape(shape = var_1666, x = hidden_states_61_cast_fp16)[name = tensor("inputs_19_cast_fp16")]; tensor var_1676 = const()[name = tensor("op_1676"), val = tensor([1])]; tensor channels_mean_19_cast_fp16 = reduce_mean(axes = var_1676, keep_dims = var_979, x = inputs_19_cast_fp16)[name = tensor("channels_mean_19_cast_fp16")]; tensor zero_mean_19_cast_fp16 = sub(x = inputs_19_cast_fp16, y = channels_mean_19_cast_fp16)[name = tensor("zero_mean_19_cast_fp16")]; tensor zero_mean_sq_19_cast_fp16 = mul(x = zero_mean_19_cast_fp16, y = zero_mean_19_cast_fp16)[name = tensor("zero_mean_sq_19_cast_fp16")]; tensor var_1680 = const()[name = tensor("op_1680"), val = tensor([1])]; tensor var_1681_cast_fp16 = reduce_mean(axes = var_1680, keep_dims = var_979, x = zero_mean_sq_19_cast_fp16)[name = tensor("op_1681_cast_fp16")]; tensor var_1682_to_fp16 = const()[name = tensor("op_1682_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1683_cast_fp16 = add(x = var_1681_cast_fp16, y = var_1682_to_fp16)[name = tensor("op_1683_cast_fp16")]; tensor denom_19_epsilon_0_to_fp16 = const()[name = tensor("denom_19_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_19_cast_fp16 = rsqrt(epsilon = denom_19_epsilon_0_to_fp16, x = var_1683_cast_fp16)[name = tensor("denom_19_cast_fp16")]; tensor out_19_cast_fp16 = mul(x = zero_mean_19_cast_fp16, y = denom_19_cast_fp16)[name = tensor("out_19_cast_fp16")]; tensor var_1687_to_fp16 = const()[name = tensor("op_1687_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75206592)))]; tensor var_1688_cast_fp16 = add(x = out_19_cast_fp16, y = var_1687_to_fp16)[name = tensor("op_1688_cast_fp16")]; tensor var_1690_to_fp16 = const()[name = tensor("op_1690_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75207936)))]; tensor hidden_states_63_cast_fp16 = mul(x = var_1688_cast_fp16, y = var_1690_to_fp16)[name = tensor("hidden_states_63_cast_fp16")]; tensor var_1697 = const()[name = tensor("op_1697"), val = tensor([1, 1])]; tensor var_1699 = const()[name = tensor("op_1699"), val = tensor([1, 1])]; tensor q_13_pad_type_0 = const()[name = tensor("q_13_pad_type_0"), val = tensor("custom")]; tensor q_13_pad_0 = const()[name = tensor("q_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(75209280)))]; tensor q_13_cast_fp16 = conv(dilations = var_1699, groups = var_984, pad = q_13_pad_0, pad_type = q_13_pad_type_0, strides = var_1697, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_63_cast_fp16)[name = tensor("q_13_cast_fp16")]; tensor var_1703 = const()[name = tensor("op_1703"), val = tensor([1, 1])]; tensor var_1705 = const()[name = tensor("op_1705"), val = tensor([1, 1])]; tensor k_25_pad_type_0 = const()[name = tensor("k_25_pad_type_0"), val = tensor("custom")]; tensor k_25_pad_0 = const()[name = tensor("k_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76028544)))]; tensor k_25_cast_fp16 = conv(dilations = var_1705, groups = var_984, pad = k_25_pad_0, pad_type = k_25_pad_type_0, strides = var_1703, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_63_cast_fp16)[name = tensor("k_25_cast_fp16")]; tensor var_1709 = const()[name = tensor("op_1709"), val = tensor([1, 1])]; tensor var_1711 = const()[name = tensor("op_1711"), val = tensor([1, 1])]; tensor v_13_pad_type_0 = const()[name = tensor("v_13_pad_type_0"), val = tensor("custom")]; tensor v_13_pad_0 = const()[name = tensor("v_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(76847808)))]; tensor v_13_cast_fp16 = conv(dilations = var_1711, groups = var_984, pad = v_13_pad_0, pad_type = v_13_pad_type_0, strides = var_1709, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_63_cast_fp16)[name = tensor("v_13_cast_fp16")]; tensor var_1715_begin_0 = const()[name = tensor("op_1715_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1715_end_0 = const()[name = tensor("op_1715_end_0"), val = tensor([2, 64, 1, 576])]; tensor var_1715_end_mask_0 = const()[name = tensor("op_1715_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1715_cast_fp16 = slice_by_index(begin = var_1715_begin_0, end = var_1715_end_0, end_mask = var_1715_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1715_cast_fp16")]; tensor var_1719_begin_0 = const()[name = tensor("op_1719_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_1719_end_0 = const()[name = tensor("op_1719_end_0"), val = tensor([2, 128, 1, 576])]; tensor var_1719_end_mask_0 = const()[name = tensor("op_1719_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1719_cast_fp16 = slice_by_index(begin = var_1719_begin_0, end = var_1719_end_0, end_mask = var_1719_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1719_cast_fp16")]; tensor var_1723_begin_0 = const()[name = tensor("op_1723_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_1723_end_0 = const()[name = tensor("op_1723_end_0"), val = tensor([2, 192, 1, 576])]; tensor var_1723_end_mask_0 = const()[name = tensor("op_1723_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1723_cast_fp16 = slice_by_index(begin = var_1723_begin_0, end = var_1723_end_0, end_mask = var_1723_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1723_cast_fp16")]; tensor var_1727_begin_0 = const()[name = tensor("op_1727_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_1727_end_0 = const()[name = tensor("op_1727_end_0"), val = tensor([2, 256, 1, 576])]; tensor var_1727_end_mask_0 = const()[name = tensor("op_1727_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1727_cast_fp16 = slice_by_index(begin = var_1727_begin_0, end = var_1727_end_0, end_mask = var_1727_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1727_cast_fp16")]; tensor var_1731_begin_0 = const()[name = tensor("op_1731_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_1731_end_0 = const()[name = tensor("op_1731_end_0"), val = tensor([2, 320, 1, 576])]; tensor var_1731_end_mask_0 = const()[name = tensor("op_1731_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1731_cast_fp16 = slice_by_index(begin = var_1731_begin_0, end = var_1731_end_0, end_mask = var_1731_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1731_cast_fp16")]; tensor var_1735_begin_0 = const()[name = tensor("op_1735_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_1735_end_0 = const()[name = tensor("op_1735_end_0"), val = tensor([2, 384, 1, 576])]; tensor var_1735_end_mask_0 = const()[name = tensor("op_1735_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1735_cast_fp16 = slice_by_index(begin = var_1735_begin_0, end = var_1735_end_0, end_mask = var_1735_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1735_cast_fp16")]; tensor var_1739_begin_0 = const()[name = tensor("op_1739_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_1739_end_0 = const()[name = tensor("op_1739_end_0"), val = tensor([2, 448, 1, 576])]; tensor var_1739_end_mask_0 = const()[name = tensor("op_1739_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1739_cast_fp16 = slice_by_index(begin = var_1739_begin_0, end = var_1739_end_0, end_mask = var_1739_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1739_cast_fp16")]; tensor var_1743_begin_0 = const()[name = tensor("op_1743_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_1743_end_0 = const()[name = tensor("op_1743_end_0"), val = tensor([2, 512, 1, 576])]; tensor var_1743_end_mask_0 = const()[name = tensor("op_1743_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1743_cast_fp16 = slice_by_index(begin = var_1743_begin_0, end = var_1743_end_0, end_mask = var_1743_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1743_cast_fp16")]; tensor var_1747_begin_0 = const()[name = tensor("op_1747_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_1747_end_0 = const()[name = tensor("op_1747_end_0"), val = tensor([2, 576, 1, 576])]; tensor var_1747_end_mask_0 = const()[name = tensor("op_1747_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1747_cast_fp16 = slice_by_index(begin = var_1747_begin_0, end = var_1747_end_0, end_mask = var_1747_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1747_cast_fp16")]; tensor var_1751_begin_0 = const()[name = tensor("op_1751_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_1751_end_0 = const()[name = tensor("op_1751_end_0"), val = tensor([2, 640, 1, 576])]; tensor var_1751_end_mask_0 = const()[name = tensor("op_1751_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1751_cast_fp16 = slice_by_index(begin = var_1751_begin_0, end = var_1751_end_0, end_mask = var_1751_end_mask_0, x = q_13_cast_fp16)[name = tensor("op_1751_cast_fp16")]; tensor k_27_perm_0 = const()[name = tensor("k_27_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_1758_begin_0 = const()[name = tensor("op_1758_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1758_end_0 = const()[name = tensor("op_1758_end_0"), val = tensor([2, 576, 1, 64])]; tensor var_1758_end_mask_0 = const()[name = tensor("op_1758_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_7 = transpose(perm = k_27_perm_0, x = k_25_cast_fp16)[name = tensor("transpose_7")]; tensor var_1758_cast_fp16 = slice_by_index(begin = var_1758_begin_0, end = var_1758_end_0, end_mask = var_1758_end_mask_0, x = transpose_7)[name = tensor("op_1758_cast_fp16")]; tensor var_1762_begin_0 = const()[name = tensor("op_1762_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_1762_end_0 = const()[name = tensor("op_1762_end_0"), val = tensor([2, 576, 1, 128])]; tensor var_1762_end_mask_0 = const()[name = tensor("op_1762_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1762_cast_fp16 = slice_by_index(begin = var_1762_begin_0, end = var_1762_end_0, end_mask = var_1762_end_mask_0, x = transpose_7)[name = tensor("op_1762_cast_fp16")]; tensor var_1766_begin_0 = const()[name = tensor("op_1766_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_1766_end_0 = const()[name = tensor("op_1766_end_0"), val = tensor([2, 576, 1, 192])]; tensor var_1766_end_mask_0 = const()[name = tensor("op_1766_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1766_cast_fp16 = slice_by_index(begin = var_1766_begin_0, end = var_1766_end_0, end_mask = var_1766_end_mask_0, x = transpose_7)[name = tensor("op_1766_cast_fp16")]; tensor var_1770_begin_0 = const()[name = tensor("op_1770_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_1770_end_0 = const()[name = tensor("op_1770_end_0"), val = tensor([2, 576, 1, 256])]; tensor var_1770_end_mask_0 = const()[name = tensor("op_1770_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1770_cast_fp16 = slice_by_index(begin = var_1770_begin_0, end = var_1770_end_0, end_mask = var_1770_end_mask_0, x = transpose_7)[name = tensor("op_1770_cast_fp16")]; tensor var_1774_begin_0 = const()[name = tensor("op_1774_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_1774_end_0 = const()[name = tensor("op_1774_end_0"), val = tensor([2, 576, 1, 320])]; tensor var_1774_end_mask_0 = const()[name = tensor("op_1774_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1774_cast_fp16 = slice_by_index(begin = var_1774_begin_0, end = var_1774_end_0, end_mask = var_1774_end_mask_0, x = transpose_7)[name = tensor("op_1774_cast_fp16")]; tensor var_1778_begin_0 = const()[name = tensor("op_1778_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_1778_end_0 = const()[name = tensor("op_1778_end_0"), val = tensor([2, 576, 1, 384])]; tensor var_1778_end_mask_0 = const()[name = tensor("op_1778_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1778_cast_fp16 = slice_by_index(begin = var_1778_begin_0, end = var_1778_end_0, end_mask = var_1778_end_mask_0, x = transpose_7)[name = tensor("op_1778_cast_fp16")]; tensor var_1782_begin_0 = const()[name = tensor("op_1782_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_1782_end_0 = const()[name = tensor("op_1782_end_0"), val = tensor([2, 576, 1, 448])]; tensor var_1782_end_mask_0 = const()[name = tensor("op_1782_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1782_cast_fp16 = slice_by_index(begin = var_1782_begin_0, end = var_1782_end_0, end_mask = var_1782_end_mask_0, x = transpose_7)[name = tensor("op_1782_cast_fp16")]; tensor var_1786_begin_0 = const()[name = tensor("op_1786_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_1786_end_0 = const()[name = tensor("op_1786_end_0"), val = tensor([2, 576, 1, 512])]; tensor var_1786_end_mask_0 = const()[name = tensor("op_1786_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1786_cast_fp16 = slice_by_index(begin = var_1786_begin_0, end = var_1786_end_0, end_mask = var_1786_end_mask_0, x = transpose_7)[name = tensor("op_1786_cast_fp16")]; tensor var_1790_begin_0 = const()[name = tensor("op_1790_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_1790_end_0 = const()[name = tensor("op_1790_end_0"), val = tensor([2, 576, 1, 576])]; tensor var_1790_end_mask_0 = const()[name = tensor("op_1790_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1790_cast_fp16 = slice_by_index(begin = var_1790_begin_0, end = var_1790_end_0, end_mask = var_1790_end_mask_0, x = transpose_7)[name = tensor("op_1790_cast_fp16")]; tensor var_1794_begin_0 = const()[name = tensor("op_1794_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_1794_end_0 = const()[name = tensor("op_1794_end_0"), val = tensor([2, 576, 1, 640])]; tensor var_1794_end_mask_0 = const()[name = tensor("op_1794_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_1794_cast_fp16 = slice_by_index(begin = var_1794_begin_0, end = var_1794_end_0, end_mask = var_1794_end_mask_0, x = transpose_7)[name = tensor("op_1794_cast_fp16")]; tensor var_1796_begin_0 = const()[name = tensor("op_1796_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1796_end_0 = const()[name = tensor("op_1796_end_0"), val = tensor([2, 64, 1, 576])]; tensor var_1796_end_mask_0 = const()[name = tensor("op_1796_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1796_cast_fp16 = slice_by_index(begin = var_1796_begin_0, end = var_1796_end_0, end_mask = var_1796_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1796_cast_fp16")]; tensor var_1800_begin_0 = const()[name = tensor("op_1800_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_1800_end_0 = const()[name = tensor("op_1800_end_0"), val = tensor([2, 128, 1, 576])]; tensor var_1800_end_mask_0 = const()[name = tensor("op_1800_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1800_cast_fp16 = slice_by_index(begin = var_1800_begin_0, end = var_1800_end_0, end_mask = var_1800_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1800_cast_fp16")]; tensor var_1804_begin_0 = const()[name = tensor("op_1804_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_1804_end_0 = const()[name = tensor("op_1804_end_0"), val = tensor([2, 192, 1, 576])]; tensor var_1804_end_mask_0 = const()[name = tensor("op_1804_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1804_cast_fp16 = slice_by_index(begin = var_1804_begin_0, end = var_1804_end_0, end_mask = var_1804_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1804_cast_fp16")]; tensor var_1808_begin_0 = const()[name = tensor("op_1808_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_1808_end_0 = const()[name = tensor("op_1808_end_0"), val = tensor([2, 256, 1, 576])]; tensor var_1808_end_mask_0 = const()[name = tensor("op_1808_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1808_cast_fp16 = slice_by_index(begin = var_1808_begin_0, end = var_1808_end_0, end_mask = var_1808_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1808_cast_fp16")]; tensor var_1812_begin_0 = const()[name = tensor("op_1812_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_1812_end_0 = const()[name = tensor("op_1812_end_0"), val = tensor([2, 320, 1, 576])]; tensor var_1812_end_mask_0 = const()[name = tensor("op_1812_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1812_cast_fp16 = slice_by_index(begin = var_1812_begin_0, end = var_1812_end_0, end_mask = var_1812_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1812_cast_fp16")]; tensor var_1816_begin_0 = const()[name = tensor("op_1816_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_1816_end_0 = const()[name = tensor("op_1816_end_0"), val = tensor([2, 384, 1, 576])]; tensor var_1816_end_mask_0 = const()[name = tensor("op_1816_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1816_cast_fp16 = slice_by_index(begin = var_1816_begin_0, end = var_1816_end_0, end_mask = var_1816_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1816_cast_fp16")]; tensor var_1820_begin_0 = const()[name = tensor("op_1820_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_1820_end_0 = const()[name = tensor("op_1820_end_0"), val = tensor([2, 448, 1, 576])]; tensor var_1820_end_mask_0 = const()[name = tensor("op_1820_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1820_cast_fp16 = slice_by_index(begin = var_1820_begin_0, end = var_1820_end_0, end_mask = var_1820_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1820_cast_fp16")]; tensor var_1824_begin_0 = const()[name = tensor("op_1824_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_1824_end_0 = const()[name = tensor("op_1824_end_0"), val = tensor([2, 512, 1, 576])]; tensor var_1824_end_mask_0 = const()[name = tensor("op_1824_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1824_cast_fp16 = slice_by_index(begin = var_1824_begin_0, end = var_1824_end_0, end_mask = var_1824_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1824_cast_fp16")]; tensor var_1828_begin_0 = const()[name = tensor("op_1828_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_1828_end_0 = const()[name = tensor("op_1828_end_0"), val = tensor([2, 576, 1, 576])]; tensor var_1828_end_mask_0 = const()[name = tensor("op_1828_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1828_cast_fp16 = slice_by_index(begin = var_1828_begin_0, end = var_1828_end_0, end_mask = var_1828_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1828_cast_fp16")]; tensor var_1832_begin_0 = const()[name = tensor("op_1832_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_1832_end_0 = const()[name = tensor("op_1832_end_0"), val = tensor([2, 640, 1, 576])]; tensor var_1832_end_mask_0 = const()[name = tensor("op_1832_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1832_cast_fp16 = slice_by_index(begin = var_1832_begin_0, end = var_1832_end_0, end_mask = var_1832_end_mask_0, x = v_13_cast_fp16)[name = tensor("op_1832_cast_fp16")]; tensor var_1836_equation_0 = const()[name = tensor("op_1836_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1836_cast_fp16 = einsum(equation = var_1836_equation_0, values = (var_1758_cast_fp16, var_1715_cast_fp16))[name = tensor("op_1836_cast_fp16")]; tensor var_1837_to_fp16 = const()[name = tensor("op_1837_to_fp16"), val = tensor(0x1p-3)]; tensor aw_81_cast_fp16 = mul(x = var_1836_cast_fp16, y = var_1837_to_fp16)[name = tensor("aw_81_cast_fp16")]; tensor var_1840_equation_0 = const()[name = tensor("op_1840_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1840_cast_fp16 = einsum(equation = var_1840_equation_0, values = (var_1762_cast_fp16, var_1719_cast_fp16))[name = tensor("op_1840_cast_fp16")]; tensor var_1841_to_fp16 = const()[name = tensor("op_1841_to_fp16"), val = tensor(0x1p-3)]; tensor aw_83_cast_fp16 = mul(x = var_1840_cast_fp16, y = var_1841_to_fp16)[name = tensor("aw_83_cast_fp16")]; tensor var_1844_equation_0 = const()[name = tensor("op_1844_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1844_cast_fp16 = einsum(equation = var_1844_equation_0, values = (var_1766_cast_fp16, var_1723_cast_fp16))[name = tensor("op_1844_cast_fp16")]; tensor var_1845_to_fp16 = const()[name = tensor("op_1845_to_fp16"), val = tensor(0x1p-3)]; tensor aw_85_cast_fp16 = mul(x = var_1844_cast_fp16, y = var_1845_to_fp16)[name = tensor("aw_85_cast_fp16")]; tensor var_1848_equation_0 = const()[name = tensor("op_1848_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1848_cast_fp16 = einsum(equation = var_1848_equation_0, values = (var_1770_cast_fp16, var_1727_cast_fp16))[name = tensor("op_1848_cast_fp16")]; tensor var_1849_to_fp16 = const()[name = tensor("op_1849_to_fp16"), val = tensor(0x1p-3)]; tensor aw_87_cast_fp16 = mul(x = var_1848_cast_fp16, y = var_1849_to_fp16)[name = tensor("aw_87_cast_fp16")]; tensor var_1852_equation_0 = const()[name = tensor("op_1852_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1852_cast_fp16 = einsum(equation = var_1852_equation_0, values = (var_1774_cast_fp16, var_1731_cast_fp16))[name = tensor("op_1852_cast_fp16")]; tensor var_1853_to_fp16 = const()[name = tensor("op_1853_to_fp16"), val = tensor(0x1p-3)]; tensor aw_89_cast_fp16 = mul(x = var_1852_cast_fp16, y = var_1853_to_fp16)[name = tensor("aw_89_cast_fp16")]; tensor var_1856_equation_0 = const()[name = tensor("op_1856_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1856_cast_fp16 = einsum(equation = var_1856_equation_0, values = (var_1778_cast_fp16, var_1735_cast_fp16))[name = tensor("op_1856_cast_fp16")]; tensor var_1857_to_fp16 = const()[name = tensor("op_1857_to_fp16"), val = tensor(0x1p-3)]; tensor aw_91_cast_fp16 = mul(x = var_1856_cast_fp16, y = var_1857_to_fp16)[name = tensor("aw_91_cast_fp16")]; tensor var_1860_equation_0 = const()[name = tensor("op_1860_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1860_cast_fp16 = einsum(equation = var_1860_equation_0, values = (var_1782_cast_fp16, var_1739_cast_fp16))[name = tensor("op_1860_cast_fp16")]; tensor var_1861_to_fp16 = const()[name = tensor("op_1861_to_fp16"), val = tensor(0x1p-3)]; tensor aw_93_cast_fp16 = mul(x = var_1860_cast_fp16, y = var_1861_to_fp16)[name = tensor("aw_93_cast_fp16")]; tensor var_1864_equation_0 = const()[name = tensor("op_1864_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1864_cast_fp16 = einsum(equation = var_1864_equation_0, values = (var_1786_cast_fp16, var_1743_cast_fp16))[name = tensor("op_1864_cast_fp16")]; tensor var_1865_to_fp16 = const()[name = tensor("op_1865_to_fp16"), val = tensor(0x1p-3)]; tensor aw_95_cast_fp16 = mul(x = var_1864_cast_fp16, y = var_1865_to_fp16)[name = tensor("aw_95_cast_fp16")]; tensor var_1868_equation_0 = const()[name = tensor("op_1868_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1868_cast_fp16 = einsum(equation = var_1868_equation_0, values = (var_1790_cast_fp16, var_1747_cast_fp16))[name = tensor("op_1868_cast_fp16")]; tensor var_1869_to_fp16 = const()[name = tensor("op_1869_to_fp16"), val = tensor(0x1p-3)]; tensor aw_97_cast_fp16 = mul(x = var_1868_cast_fp16, y = var_1869_to_fp16)[name = tensor("aw_97_cast_fp16")]; tensor var_1872_equation_0 = const()[name = tensor("op_1872_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_1872_cast_fp16 = einsum(equation = var_1872_equation_0, values = (var_1794_cast_fp16, var_1751_cast_fp16))[name = tensor("op_1872_cast_fp16")]; tensor var_1873_to_fp16 = const()[name = tensor("op_1873_to_fp16"), val = tensor(0x1p-3)]; tensor aw_99_cast_fp16 = mul(x = var_1872_cast_fp16, y = var_1873_to_fp16)[name = tensor("aw_99_cast_fp16")]; tensor var_1875_cast_fp16 = softmax(axis = var_984, x = aw_81_cast_fp16)[name = tensor("op_1875_cast_fp16")]; tensor var_1876_cast_fp16 = softmax(axis = var_984, x = aw_83_cast_fp16)[name = tensor("op_1876_cast_fp16")]; tensor var_1877_cast_fp16 = softmax(axis = var_984, x = aw_85_cast_fp16)[name = tensor("op_1877_cast_fp16")]; tensor var_1878_cast_fp16 = softmax(axis = var_984, x = aw_87_cast_fp16)[name = tensor("op_1878_cast_fp16")]; tensor var_1879_cast_fp16 = softmax(axis = var_984, x = aw_89_cast_fp16)[name = tensor("op_1879_cast_fp16")]; tensor var_1880_cast_fp16 = softmax(axis = var_984, x = aw_91_cast_fp16)[name = tensor("op_1880_cast_fp16")]; tensor var_1881_cast_fp16 = softmax(axis = var_984, x = aw_93_cast_fp16)[name = tensor("op_1881_cast_fp16")]; tensor var_1882_cast_fp16 = softmax(axis = var_984, x = aw_95_cast_fp16)[name = tensor("op_1882_cast_fp16")]; tensor var_1883_cast_fp16 = softmax(axis = var_984, x = aw_97_cast_fp16)[name = tensor("op_1883_cast_fp16")]; tensor var_1884_cast_fp16 = softmax(axis = var_984, x = aw_99_cast_fp16)[name = tensor("op_1884_cast_fp16")]; tensor var_1886_equation_0 = const()[name = tensor("op_1886_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1886_cast_fp16 = einsum(equation = var_1886_equation_0, values = (var_1796_cast_fp16, var_1875_cast_fp16))[name = tensor("op_1886_cast_fp16")]; tensor var_1888_equation_0 = const()[name = tensor("op_1888_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1888_cast_fp16 = einsum(equation = var_1888_equation_0, values = (var_1800_cast_fp16, var_1876_cast_fp16))[name = tensor("op_1888_cast_fp16")]; tensor var_1890_equation_0 = const()[name = tensor("op_1890_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1890_cast_fp16 = einsum(equation = var_1890_equation_0, values = (var_1804_cast_fp16, var_1877_cast_fp16))[name = tensor("op_1890_cast_fp16")]; tensor var_1892_equation_0 = const()[name = tensor("op_1892_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1892_cast_fp16 = einsum(equation = var_1892_equation_0, values = (var_1808_cast_fp16, var_1878_cast_fp16))[name = tensor("op_1892_cast_fp16")]; tensor var_1894_equation_0 = const()[name = tensor("op_1894_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1894_cast_fp16 = einsum(equation = var_1894_equation_0, values = (var_1812_cast_fp16, var_1879_cast_fp16))[name = tensor("op_1894_cast_fp16")]; tensor var_1896_equation_0 = const()[name = tensor("op_1896_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1896_cast_fp16 = einsum(equation = var_1896_equation_0, values = (var_1816_cast_fp16, var_1880_cast_fp16))[name = tensor("op_1896_cast_fp16")]; tensor var_1898_equation_0 = const()[name = tensor("op_1898_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1898_cast_fp16 = einsum(equation = var_1898_equation_0, values = (var_1820_cast_fp16, var_1881_cast_fp16))[name = tensor("op_1898_cast_fp16")]; tensor var_1900_equation_0 = const()[name = tensor("op_1900_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1900_cast_fp16 = einsum(equation = var_1900_equation_0, values = (var_1824_cast_fp16, var_1882_cast_fp16))[name = tensor("op_1900_cast_fp16")]; tensor var_1902_equation_0 = const()[name = tensor("op_1902_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1902_cast_fp16 = einsum(equation = var_1902_equation_0, values = (var_1828_cast_fp16, var_1883_cast_fp16))[name = tensor("op_1902_cast_fp16")]; tensor var_1904_equation_0 = const()[name = tensor("op_1904_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_1904_cast_fp16 = einsum(equation = var_1904_equation_0, values = (var_1832_cast_fp16, var_1884_cast_fp16))[name = tensor("op_1904_cast_fp16")]; tensor input_105_interleave_0 = const()[name = tensor("input_105_interleave_0"), val = tensor(false)]; tensor input_105_cast_fp16 = concat(axis = var_984, interleave = input_105_interleave_0, values = (var_1886_cast_fp16, var_1888_cast_fp16, var_1890_cast_fp16, var_1892_cast_fp16, var_1894_cast_fp16, var_1896_cast_fp16, var_1898_cast_fp16, var_1900_cast_fp16, var_1902_cast_fp16, var_1904_cast_fp16))[name = tensor("input_105_cast_fp16")]; tensor var_1910 = const()[name = tensor("op_1910"), val = tensor([1, 1])]; tensor var_1912 = const()[name = tensor("op_1912"), val = tensor([1, 1])]; tensor var_1914_pad_type_0 = const()[name = tensor("op_1914_pad_type_0"), val = tensor("custom")]; tensor var_1914_pad_0 = const()[name = tensor("op_1914_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77667072)))]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78486336)))]; tensor var_1914_cast_fp16 = conv(bias = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_1912, groups = var_984, pad = var_1914_pad_0, pad_type = var_1914_pad_type_0, strides = var_1910, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_105_cast_fp16)[name = tensor("op_1914_cast_fp16")]; tensor inputs_21_cast_fp16 = add(x = var_1914_cast_fp16, y = inputs_19_cast_fp16)[name = tensor("inputs_21_cast_fp16")]; tensor var_1918 = const()[name = tensor("op_1918"), val = tensor([1])]; tensor channels_mean_21_cast_fp16 = reduce_mean(axes = var_1918, keep_dims = var_979, x = inputs_21_cast_fp16)[name = tensor("channels_mean_21_cast_fp16")]; tensor zero_mean_21_cast_fp16 = sub(x = inputs_21_cast_fp16, y = channels_mean_21_cast_fp16)[name = tensor("zero_mean_21_cast_fp16")]; tensor zero_mean_sq_21_cast_fp16 = mul(x = zero_mean_21_cast_fp16, y = zero_mean_21_cast_fp16)[name = tensor("zero_mean_sq_21_cast_fp16")]; tensor var_1922 = const()[name = tensor("op_1922"), val = tensor([1])]; tensor var_1923_cast_fp16 = reduce_mean(axes = var_1922, keep_dims = var_979, x = zero_mean_sq_21_cast_fp16)[name = tensor("op_1923_cast_fp16")]; tensor var_1924_to_fp16 = const()[name = tensor("op_1924_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1925_cast_fp16 = add(x = var_1923_cast_fp16, y = var_1924_to_fp16)[name = tensor("op_1925_cast_fp16")]; tensor denom_21_epsilon_0_to_fp16 = const()[name = tensor("denom_21_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_21_cast_fp16 = rsqrt(epsilon = denom_21_epsilon_0_to_fp16, x = var_1925_cast_fp16)[name = tensor("denom_21_cast_fp16")]; tensor out_21_cast_fp16 = mul(x = zero_mean_21_cast_fp16, y = denom_21_cast_fp16)[name = tensor("out_21_cast_fp16")]; tensor var_1929_to_fp16 = const()[name = tensor("op_1929_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78487680)))]; tensor var_1930_cast_fp16 = add(x = out_21_cast_fp16, y = var_1929_to_fp16)[name = tensor("op_1930_cast_fp16")]; tensor var_1932_to_fp16 = const()[name = tensor("op_1932_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78489024)))]; tensor hidden_states_65_cast_fp16 = mul(x = var_1930_cast_fp16, y = var_1932_to_fp16)[name = tensor("hidden_states_65_cast_fp16")]; tensor var_1939 = const()[name = tensor("op_1939"), val = tensor([1, 1])]; tensor var_1941 = const()[name = tensor("op_1941"), val = tensor([1, 1])]; tensor q_15_pad_type_0 = const()[name = tensor("q_15_pad_type_0"), val = tensor("custom")]; tensor q_15_pad_0 = const()[name = tensor("q_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(78490368)))]; tensor q_15_cast_fp16 = conv(dilations = var_1941, groups = var_984, pad = q_15_pad_0, pad_type = q_15_pad_type_0, strides = var_1939, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_65_cast_fp16)[name = tensor("q_15_cast_fp16")]; tensor var_1945 = const()[name = tensor("op_1945"), val = tensor([1, 1])]; tensor var_1947 = const()[name = tensor("op_1947"), val = tensor([1, 1])]; tensor k_29_pad_type_0 = const()[name = tensor("k_29_pad_type_0"), val = tensor("custom")]; tensor k_29_pad_0 = const()[name = tensor("k_29_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(79309632)))]; tensor k_29_cast_fp16 = conv(dilations = var_1947, groups = var_984, pad = k_29_pad_0, pad_type = k_29_pad_type_0, strides = var_1945, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_29_cast_fp16")]; tensor var_1951 = const()[name = tensor("op_1951"), val = tensor([1, 1])]; tensor var_1953 = const()[name = tensor("op_1953"), val = tensor([1, 1])]; tensor v_15_pad_type_0 = const()[name = tensor("v_15_pad_type_0"), val = tensor("custom")]; tensor v_15_pad_0 = const()[name = tensor("v_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(80620416)))]; tensor v_15_cast_fp16 = conv(dilations = var_1953, groups = var_984, pad = v_15_pad_0, pad_type = v_15_pad_type_0, strides = var_1951, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_15_cast_fp16")]; tensor var_1957_begin_0 = const()[name = tensor("op_1957_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_1957_end_0 = const()[name = tensor("op_1957_end_0"), val = tensor([2, 64, 1, 576])]; tensor var_1957_end_mask_0 = const()[name = tensor("op_1957_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1957_cast_fp16 = slice_by_index(begin = var_1957_begin_0, end = var_1957_end_0, end_mask = var_1957_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1957_cast_fp16")]; tensor var_1961_begin_0 = const()[name = tensor("op_1961_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_1961_end_0 = const()[name = tensor("op_1961_end_0"), val = tensor([2, 128, 1, 576])]; tensor var_1961_end_mask_0 = const()[name = tensor("op_1961_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1961_cast_fp16 = slice_by_index(begin = var_1961_begin_0, end = var_1961_end_0, end_mask = var_1961_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1961_cast_fp16")]; tensor var_1965_begin_0 = const()[name = tensor("op_1965_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_1965_end_0 = const()[name = tensor("op_1965_end_0"), val = tensor([2, 192, 1, 576])]; tensor var_1965_end_mask_0 = const()[name = tensor("op_1965_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1965_cast_fp16 = slice_by_index(begin = var_1965_begin_0, end = var_1965_end_0, end_mask = var_1965_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1965_cast_fp16")]; tensor var_1969_begin_0 = const()[name = tensor("op_1969_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_1969_end_0 = const()[name = tensor("op_1969_end_0"), val = tensor([2, 256, 1, 576])]; tensor var_1969_end_mask_0 = const()[name = tensor("op_1969_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1969_cast_fp16 = slice_by_index(begin = var_1969_begin_0, end = var_1969_end_0, end_mask = var_1969_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1969_cast_fp16")]; tensor var_1973_begin_0 = const()[name = tensor("op_1973_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_1973_end_0 = const()[name = tensor("op_1973_end_0"), val = tensor([2, 320, 1, 576])]; tensor var_1973_end_mask_0 = const()[name = tensor("op_1973_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1973_cast_fp16 = slice_by_index(begin = var_1973_begin_0, end = var_1973_end_0, end_mask = var_1973_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1973_cast_fp16")]; tensor var_1977_begin_0 = const()[name = tensor("op_1977_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_1977_end_0 = const()[name = tensor("op_1977_end_0"), val = tensor([2, 384, 1, 576])]; tensor var_1977_end_mask_0 = const()[name = tensor("op_1977_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1977_cast_fp16 = slice_by_index(begin = var_1977_begin_0, end = var_1977_end_0, end_mask = var_1977_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1977_cast_fp16")]; tensor var_1981_begin_0 = const()[name = tensor("op_1981_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_1981_end_0 = const()[name = tensor("op_1981_end_0"), val = tensor([2, 448, 1, 576])]; tensor var_1981_end_mask_0 = const()[name = tensor("op_1981_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1981_cast_fp16 = slice_by_index(begin = var_1981_begin_0, end = var_1981_end_0, end_mask = var_1981_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1981_cast_fp16")]; tensor var_1985_begin_0 = const()[name = tensor("op_1985_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_1985_end_0 = const()[name = tensor("op_1985_end_0"), val = tensor([2, 512, 1, 576])]; tensor var_1985_end_mask_0 = const()[name = tensor("op_1985_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1985_cast_fp16 = slice_by_index(begin = var_1985_begin_0, end = var_1985_end_0, end_mask = var_1985_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1985_cast_fp16")]; tensor var_1989_begin_0 = const()[name = tensor("op_1989_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_1989_end_0 = const()[name = tensor("op_1989_end_0"), val = tensor([2, 576, 1, 576])]; tensor var_1989_end_mask_0 = const()[name = tensor("op_1989_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1989_cast_fp16 = slice_by_index(begin = var_1989_begin_0, end = var_1989_end_0, end_mask = var_1989_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1989_cast_fp16")]; tensor var_1993_begin_0 = const()[name = tensor("op_1993_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_1993_end_0 = const()[name = tensor("op_1993_end_0"), val = tensor([2, 640, 1, 576])]; tensor var_1993_end_mask_0 = const()[name = tensor("op_1993_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_1993_cast_fp16 = slice_by_index(begin = var_1993_begin_0, end = var_1993_end_0, end_mask = var_1993_end_mask_0, x = q_15_cast_fp16)[name = tensor("op_1993_cast_fp16")]; tensor k_31_perm_0 = const()[name = tensor("k_31_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_2000_begin_0 = const()[name = tensor("op_2000_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_2000_end_0 = const()[name = tensor("op_2000_end_0"), val = tensor([2, 77, 1, 64])]; tensor var_2000_end_mask_0 = const()[name = tensor("op_2000_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_6 = transpose(perm = k_31_perm_0, x = k_29_cast_fp16)[name = tensor("transpose_6")]; tensor var_2000_cast_fp16 = slice_by_index(begin = var_2000_begin_0, end = var_2000_end_0, end_mask = var_2000_end_mask_0, x = transpose_6)[name = tensor("op_2000_cast_fp16")]; tensor var_2004_begin_0 = const()[name = tensor("op_2004_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_2004_end_0 = const()[name = tensor("op_2004_end_0"), val = tensor([2, 77, 1, 128])]; tensor var_2004_end_mask_0 = const()[name = tensor("op_2004_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2004_cast_fp16 = slice_by_index(begin = var_2004_begin_0, end = var_2004_end_0, end_mask = var_2004_end_mask_0, x = transpose_6)[name = tensor("op_2004_cast_fp16")]; tensor var_2008_begin_0 = const()[name = tensor("op_2008_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_2008_end_0 = const()[name = tensor("op_2008_end_0"), val = tensor([2, 77, 1, 192])]; tensor var_2008_end_mask_0 = const()[name = tensor("op_2008_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2008_cast_fp16 = slice_by_index(begin = var_2008_begin_0, end = var_2008_end_0, end_mask = var_2008_end_mask_0, x = transpose_6)[name = tensor("op_2008_cast_fp16")]; tensor var_2012_begin_0 = const()[name = tensor("op_2012_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_2012_end_0 = const()[name = tensor("op_2012_end_0"), val = tensor([2, 77, 1, 256])]; tensor var_2012_end_mask_0 = const()[name = tensor("op_2012_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2012_cast_fp16 = slice_by_index(begin = var_2012_begin_0, end = var_2012_end_0, end_mask = var_2012_end_mask_0, x = transpose_6)[name = tensor("op_2012_cast_fp16")]; tensor var_2016_begin_0 = const()[name = tensor("op_2016_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_2016_end_0 = const()[name = tensor("op_2016_end_0"), val = tensor([2, 77, 1, 320])]; tensor var_2016_end_mask_0 = const()[name = tensor("op_2016_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2016_cast_fp16 = slice_by_index(begin = var_2016_begin_0, end = var_2016_end_0, end_mask = var_2016_end_mask_0, x = transpose_6)[name = tensor("op_2016_cast_fp16")]; tensor var_2020_begin_0 = const()[name = tensor("op_2020_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_2020_end_0 = const()[name = tensor("op_2020_end_0"), val = tensor([2, 77, 1, 384])]; tensor var_2020_end_mask_0 = const()[name = tensor("op_2020_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2020_cast_fp16 = slice_by_index(begin = var_2020_begin_0, end = var_2020_end_0, end_mask = var_2020_end_mask_0, x = transpose_6)[name = tensor("op_2020_cast_fp16")]; tensor var_2024_begin_0 = const()[name = tensor("op_2024_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_2024_end_0 = const()[name = tensor("op_2024_end_0"), val = tensor([2, 77, 1, 448])]; tensor var_2024_end_mask_0 = const()[name = tensor("op_2024_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2024_cast_fp16 = slice_by_index(begin = var_2024_begin_0, end = var_2024_end_0, end_mask = var_2024_end_mask_0, x = transpose_6)[name = tensor("op_2024_cast_fp16")]; tensor var_2028_begin_0 = const()[name = tensor("op_2028_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_2028_end_0 = const()[name = tensor("op_2028_end_0"), val = tensor([2, 77, 1, 512])]; tensor var_2028_end_mask_0 = const()[name = tensor("op_2028_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2028_cast_fp16 = slice_by_index(begin = var_2028_begin_0, end = var_2028_end_0, end_mask = var_2028_end_mask_0, x = transpose_6)[name = tensor("op_2028_cast_fp16")]; tensor var_2032_begin_0 = const()[name = tensor("op_2032_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_2032_end_0 = const()[name = tensor("op_2032_end_0"), val = tensor([2, 77, 1, 576])]; tensor var_2032_end_mask_0 = const()[name = tensor("op_2032_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2032_cast_fp16 = slice_by_index(begin = var_2032_begin_0, end = var_2032_end_0, end_mask = var_2032_end_mask_0, x = transpose_6)[name = tensor("op_2032_cast_fp16")]; tensor var_2036_begin_0 = const()[name = tensor("op_2036_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_2036_end_0 = const()[name = tensor("op_2036_end_0"), val = tensor([2, 77, 1, 640])]; tensor var_2036_end_mask_0 = const()[name = tensor("op_2036_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2036_cast_fp16 = slice_by_index(begin = var_2036_begin_0, end = var_2036_end_0, end_mask = var_2036_end_mask_0, x = transpose_6)[name = tensor("op_2036_cast_fp16")]; tensor var_2038_begin_0 = const()[name = tensor("op_2038_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_2038_end_0 = const()[name = tensor("op_2038_end_0"), val = tensor([2, 64, 1, 77])]; tensor var_2038_end_mask_0 = const()[name = tensor("op_2038_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2038_cast_fp16 = slice_by_index(begin = var_2038_begin_0, end = var_2038_end_0, end_mask = var_2038_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2038_cast_fp16")]; tensor var_2042_begin_0 = const()[name = tensor("op_2042_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_2042_end_0 = const()[name = tensor("op_2042_end_0"), val = tensor([2, 128, 1, 77])]; tensor var_2042_end_mask_0 = const()[name = tensor("op_2042_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2042_cast_fp16 = slice_by_index(begin = var_2042_begin_0, end = var_2042_end_0, end_mask = var_2042_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2042_cast_fp16")]; tensor var_2046_begin_0 = const()[name = tensor("op_2046_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_2046_end_0 = const()[name = tensor("op_2046_end_0"), val = tensor([2, 192, 1, 77])]; tensor var_2046_end_mask_0 = const()[name = tensor("op_2046_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2046_cast_fp16 = slice_by_index(begin = var_2046_begin_0, end = var_2046_end_0, end_mask = var_2046_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2046_cast_fp16")]; tensor var_2050_begin_0 = const()[name = tensor("op_2050_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_2050_end_0 = const()[name = tensor("op_2050_end_0"), val = tensor([2, 256, 1, 77])]; tensor var_2050_end_mask_0 = const()[name = tensor("op_2050_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2050_cast_fp16 = slice_by_index(begin = var_2050_begin_0, end = var_2050_end_0, end_mask = var_2050_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2050_cast_fp16")]; tensor var_2054_begin_0 = const()[name = tensor("op_2054_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_2054_end_0 = const()[name = tensor("op_2054_end_0"), val = tensor([2, 320, 1, 77])]; tensor var_2054_end_mask_0 = const()[name = tensor("op_2054_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2054_cast_fp16 = slice_by_index(begin = var_2054_begin_0, end = var_2054_end_0, end_mask = var_2054_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2054_cast_fp16")]; tensor var_2058_begin_0 = const()[name = tensor("op_2058_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_2058_end_0 = const()[name = tensor("op_2058_end_0"), val = tensor([2, 384, 1, 77])]; tensor var_2058_end_mask_0 = const()[name = tensor("op_2058_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2058_cast_fp16 = slice_by_index(begin = var_2058_begin_0, end = var_2058_end_0, end_mask = var_2058_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2058_cast_fp16")]; tensor var_2062_begin_0 = const()[name = tensor("op_2062_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_2062_end_0 = const()[name = tensor("op_2062_end_0"), val = tensor([2, 448, 1, 77])]; tensor var_2062_end_mask_0 = const()[name = tensor("op_2062_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2062_cast_fp16 = slice_by_index(begin = var_2062_begin_0, end = var_2062_end_0, end_mask = var_2062_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2062_cast_fp16")]; tensor var_2066_begin_0 = const()[name = tensor("op_2066_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_2066_end_0 = const()[name = tensor("op_2066_end_0"), val = tensor([2, 512, 1, 77])]; tensor var_2066_end_mask_0 = const()[name = tensor("op_2066_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2066_cast_fp16 = slice_by_index(begin = var_2066_begin_0, end = var_2066_end_0, end_mask = var_2066_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2066_cast_fp16")]; tensor var_2070_begin_0 = const()[name = tensor("op_2070_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_2070_end_0 = const()[name = tensor("op_2070_end_0"), val = tensor([2, 576, 1, 77])]; tensor var_2070_end_mask_0 = const()[name = tensor("op_2070_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2070_cast_fp16 = slice_by_index(begin = var_2070_begin_0, end = var_2070_end_0, end_mask = var_2070_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2070_cast_fp16")]; tensor var_2074_begin_0 = const()[name = tensor("op_2074_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_2074_end_0 = const()[name = tensor("op_2074_end_0"), val = tensor([2, 640, 1, 77])]; tensor var_2074_end_mask_0 = const()[name = tensor("op_2074_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2074_cast_fp16 = slice_by_index(begin = var_2074_begin_0, end = var_2074_end_0, end_mask = var_2074_end_mask_0, x = v_15_cast_fp16)[name = tensor("op_2074_cast_fp16")]; tensor var_2078_equation_0 = const()[name = tensor("op_2078_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2078_cast_fp16 = einsum(equation = var_2078_equation_0, values = (var_2000_cast_fp16, var_1957_cast_fp16))[name = tensor("op_2078_cast_fp16")]; tensor var_2079_to_fp16 = const()[name = tensor("op_2079_to_fp16"), val = tensor(0x1p-3)]; tensor aw_101_cast_fp16 = mul(x = var_2078_cast_fp16, y = var_2079_to_fp16)[name = tensor("aw_101_cast_fp16")]; tensor var_2082_equation_0 = const()[name = tensor("op_2082_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2082_cast_fp16 = einsum(equation = var_2082_equation_0, values = (var_2004_cast_fp16, var_1961_cast_fp16))[name = tensor("op_2082_cast_fp16")]; tensor var_2083_to_fp16 = const()[name = tensor("op_2083_to_fp16"), val = tensor(0x1p-3)]; tensor aw_103_cast_fp16 = mul(x = var_2082_cast_fp16, y = var_2083_to_fp16)[name = tensor("aw_103_cast_fp16")]; tensor var_2086_equation_0 = const()[name = tensor("op_2086_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2086_cast_fp16 = einsum(equation = var_2086_equation_0, values = (var_2008_cast_fp16, var_1965_cast_fp16))[name = tensor("op_2086_cast_fp16")]; tensor var_2087_to_fp16 = const()[name = tensor("op_2087_to_fp16"), val = tensor(0x1p-3)]; tensor aw_105_cast_fp16 = mul(x = var_2086_cast_fp16, y = var_2087_to_fp16)[name = tensor("aw_105_cast_fp16")]; tensor var_2090_equation_0 = const()[name = tensor("op_2090_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2090_cast_fp16 = einsum(equation = var_2090_equation_0, values = (var_2012_cast_fp16, var_1969_cast_fp16))[name = tensor("op_2090_cast_fp16")]; tensor var_2091_to_fp16 = const()[name = tensor("op_2091_to_fp16"), val = tensor(0x1p-3)]; tensor aw_107_cast_fp16 = mul(x = var_2090_cast_fp16, y = var_2091_to_fp16)[name = tensor("aw_107_cast_fp16")]; tensor var_2094_equation_0 = const()[name = tensor("op_2094_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2094_cast_fp16 = einsum(equation = var_2094_equation_0, values = (var_2016_cast_fp16, var_1973_cast_fp16))[name = tensor("op_2094_cast_fp16")]; tensor var_2095_to_fp16 = const()[name = tensor("op_2095_to_fp16"), val = tensor(0x1p-3)]; tensor aw_109_cast_fp16 = mul(x = var_2094_cast_fp16, y = var_2095_to_fp16)[name = tensor("aw_109_cast_fp16")]; tensor var_2098_equation_0 = const()[name = tensor("op_2098_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2098_cast_fp16 = einsum(equation = var_2098_equation_0, values = (var_2020_cast_fp16, var_1977_cast_fp16))[name = tensor("op_2098_cast_fp16")]; tensor var_2099_to_fp16 = const()[name = tensor("op_2099_to_fp16"), val = tensor(0x1p-3)]; tensor aw_111_cast_fp16 = mul(x = var_2098_cast_fp16, y = var_2099_to_fp16)[name = tensor("aw_111_cast_fp16")]; tensor var_2102_equation_0 = const()[name = tensor("op_2102_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2102_cast_fp16 = einsum(equation = var_2102_equation_0, values = (var_2024_cast_fp16, var_1981_cast_fp16))[name = tensor("op_2102_cast_fp16")]; tensor var_2103_to_fp16 = const()[name = tensor("op_2103_to_fp16"), val = tensor(0x1p-3)]; tensor aw_113_cast_fp16 = mul(x = var_2102_cast_fp16, y = var_2103_to_fp16)[name = tensor("aw_113_cast_fp16")]; tensor var_2106_equation_0 = const()[name = tensor("op_2106_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2106_cast_fp16 = einsum(equation = var_2106_equation_0, values = (var_2028_cast_fp16, var_1985_cast_fp16))[name = tensor("op_2106_cast_fp16")]; tensor var_2107_to_fp16 = const()[name = tensor("op_2107_to_fp16"), val = tensor(0x1p-3)]; tensor aw_115_cast_fp16 = mul(x = var_2106_cast_fp16, y = var_2107_to_fp16)[name = tensor("aw_115_cast_fp16")]; tensor var_2110_equation_0 = const()[name = tensor("op_2110_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2110_cast_fp16 = einsum(equation = var_2110_equation_0, values = (var_2032_cast_fp16, var_1989_cast_fp16))[name = tensor("op_2110_cast_fp16")]; tensor var_2111_to_fp16 = const()[name = tensor("op_2111_to_fp16"), val = tensor(0x1p-3)]; tensor aw_117_cast_fp16 = mul(x = var_2110_cast_fp16, y = var_2111_to_fp16)[name = tensor("aw_117_cast_fp16")]; tensor var_2114_equation_0 = const()[name = tensor("op_2114_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2114_cast_fp16 = einsum(equation = var_2114_equation_0, values = (var_2036_cast_fp16, var_1993_cast_fp16))[name = tensor("op_2114_cast_fp16")]; tensor var_2115_to_fp16 = const()[name = tensor("op_2115_to_fp16"), val = tensor(0x1p-3)]; tensor aw_119_cast_fp16 = mul(x = var_2114_cast_fp16, y = var_2115_to_fp16)[name = tensor("aw_119_cast_fp16")]; tensor var_2117_cast_fp16 = softmax(axis = var_984, x = aw_101_cast_fp16)[name = tensor("op_2117_cast_fp16")]; tensor var_2118_cast_fp16 = softmax(axis = var_984, x = aw_103_cast_fp16)[name = tensor("op_2118_cast_fp16")]; tensor var_2119_cast_fp16 = softmax(axis = var_984, x = aw_105_cast_fp16)[name = tensor("op_2119_cast_fp16")]; tensor var_2120_cast_fp16 = softmax(axis = var_984, x = aw_107_cast_fp16)[name = tensor("op_2120_cast_fp16")]; tensor var_2121_cast_fp16 = softmax(axis = var_984, x = aw_109_cast_fp16)[name = tensor("op_2121_cast_fp16")]; tensor var_2122_cast_fp16 = softmax(axis = var_984, x = aw_111_cast_fp16)[name = tensor("op_2122_cast_fp16")]; tensor var_2123_cast_fp16 = softmax(axis = var_984, x = aw_113_cast_fp16)[name = tensor("op_2123_cast_fp16")]; tensor var_2124_cast_fp16 = softmax(axis = var_984, x = aw_115_cast_fp16)[name = tensor("op_2124_cast_fp16")]; tensor var_2125_cast_fp16 = softmax(axis = var_984, x = aw_117_cast_fp16)[name = tensor("op_2125_cast_fp16")]; tensor var_2126_cast_fp16 = softmax(axis = var_984, x = aw_119_cast_fp16)[name = tensor("op_2126_cast_fp16")]; tensor var_2128_equation_0 = const()[name = tensor("op_2128_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2128_cast_fp16 = einsum(equation = var_2128_equation_0, values = (var_2038_cast_fp16, var_2117_cast_fp16))[name = tensor("op_2128_cast_fp16")]; tensor var_2130_equation_0 = const()[name = tensor("op_2130_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2130_cast_fp16 = einsum(equation = var_2130_equation_0, values = (var_2042_cast_fp16, var_2118_cast_fp16))[name = tensor("op_2130_cast_fp16")]; tensor var_2132_equation_0 = const()[name = tensor("op_2132_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2132_cast_fp16 = einsum(equation = var_2132_equation_0, values = (var_2046_cast_fp16, var_2119_cast_fp16))[name = tensor("op_2132_cast_fp16")]; tensor var_2134_equation_0 = const()[name = tensor("op_2134_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2134_cast_fp16 = einsum(equation = var_2134_equation_0, values = (var_2050_cast_fp16, var_2120_cast_fp16))[name = tensor("op_2134_cast_fp16")]; tensor var_2136_equation_0 = const()[name = tensor("op_2136_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2136_cast_fp16 = einsum(equation = var_2136_equation_0, values = (var_2054_cast_fp16, var_2121_cast_fp16))[name = tensor("op_2136_cast_fp16")]; tensor var_2138_equation_0 = const()[name = tensor("op_2138_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2138_cast_fp16 = einsum(equation = var_2138_equation_0, values = (var_2058_cast_fp16, var_2122_cast_fp16))[name = tensor("op_2138_cast_fp16")]; tensor var_2140_equation_0 = const()[name = tensor("op_2140_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2140_cast_fp16 = einsum(equation = var_2140_equation_0, values = (var_2062_cast_fp16, var_2123_cast_fp16))[name = tensor("op_2140_cast_fp16")]; tensor var_2142_equation_0 = const()[name = tensor("op_2142_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2142_cast_fp16 = einsum(equation = var_2142_equation_0, values = (var_2066_cast_fp16, var_2124_cast_fp16))[name = tensor("op_2142_cast_fp16")]; tensor var_2144_equation_0 = const()[name = tensor("op_2144_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2144_cast_fp16 = einsum(equation = var_2144_equation_0, values = (var_2070_cast_fp16, var_2125_cast_fp16))[name = tensor("op_2144_cast_fp16")]; tensor var_2146_equation_0 = const()[name = tensor("op_2146_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2146_cast_fp16 = einsum(equation = var_2146_equation_0, values = (var_2074_cast_fp16, var_2126_cast_fp16))[name = tensor("op_2146_cast_fp16")]; tensor input_107_interleave_0 = const()[name = tensor("input_107_interleave_0"), val = tensor(false)]; tensor input_107_cast_fp16 = concat(axis = var_984, interleave = input_107_interleave_0, values = (var_2128_cast_fp16, var_2130_cast_fp16, var_2132_cast_fp16, var_2134_cast_fp16, var_2136_cast_fp16, var_2138_cast_fp16, var_2140_cast_fp16, var_2142_cast_fp16, var_2144_cast_fp16, var_2146_cast_fp16))[name = tensor("input_107_cast_fp16")]; tensor var_2152 = const()[name = tensor("op_2152"), val = tensor([1, 1])]; tensor var_2154 = const()[name = tensor("op_2154"), val = tensor([1, 1])]; tensor var_2156_pad_type_0 = const()[name = tensor("op_2156_pad_type_0"), val = tensor("custom")]; tensor var_2156_pad_0 = const()[name = tensor("op_2156_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(81931200)))]; tensor down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82750464)))]; tensor var_2156_cast_fp16 = conv(bias = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_2154, groups = var_984, pad = var_2156_pad_0, pad_type = var_2156_pad_type_0, strides = var_2152, weight = down_blocks_1_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_107_cast_fp16)[name = tensor("op_2156_cast_fp16")]; tensor inputs_23_cast_fp16 = add(x = var_2156_cast_fp16, y = inputs_21_cast_fp16)[name = tensor("inputs_23_cast_fp16")]; tensor var_2160 = const()[name = tensor("op_2160"), val = tensor([1])]; tensor channels_mean_23_cast_fp16 = reduce_mean(axes = var_2160, keep_dims = var_979, x = inputs_23_cast_fp16)[name = tensor("channels_mean_23_cast_fp16")]; tensor zero_mean_23_cast_fp16 = sub(x = inputs_23_cast_fp16, y = channels_mean_23_cast_fp16)[name = tensor("zero_mean_23_cast_fp16")]; tensor zero_mean_sq_23_cast_fp16 = mul(x = zero_mean_23_cast_fp16, y = zero_mean_23_cast_fp16)[name = tensor("zero_mean_sq_23_cast_fp16")]; tensor var_2164 = const()[name = tensor("op_2164"), val = tensor([1])]; tensor var_2165_cast_fp16 = reduce_mean(axes = var_2164, keep_dims = var_979, x = zero_mean_sq_23_cast_fp16)[name = tensor("op_2165_cast_fp16")]; tensor var_2166_to_fp16 = const()[name = tensor("op_2166_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2167_cast_fp16 = add(x = var_2165_cast_fp16, y = var_2166_to_fp16)[name = tensor("op_2167_cast_fp16")]; tensor denom_23_epsilon_0_to_fp16 = const()[name = tensor("denom_23_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_23_cast_fp16 = rsqrt(epsilon = denom_23_epsilon_0_to_fp16, x = var_2167_cast_fp16)[name = tensor("denom_23_cast_fp16")]; tensor out_23_cast_fp16 = mul(x = zero_mean_23_cast_fp16, y = denom_23_cast_fp16)[name = tensor("out_23_cast_fp16")]; tensor var_2171_to_fp16 = const()[name = tensor("op_2171_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82751808)))]; tensor var_2172_cast_fp16 = add(x = out_23_cast_fp16, y = var_2171_to_fp16)[name = tensor("op_2172_cast_fp16")]; tensor var_2174_to_fp16 = const()[name = tensor("op_2174_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82753152)))]; tensor input_109_cast_fp16 = mul(x = var_2172_cast_fp16, y = var_2174_to_fp16)[name = tensor("input_109_cast_fp16")]; tensor var_2182 = const()[name = tensor("op_2182"), val = tensor([1, 1])]; tensor var_2184 = const()[name = tensor("op_2184"), val = tensor([1, 1])]; tensor var_2186_pad_type_0 = const()[name = tensor("op_2186_pad_type_0"), val = tensor("custom")]; tensor var_2186_pad_0 = const()[name = tensor("op_2186_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(82754496)))]; tensor down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89308160)))]; tensor var_2186_cast_fp16 = conv(bias = down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_2184, groups = var_984, pad = var_2186_pad_0, pad_type = var_2186_pad_type_0, strides = var_2182, weight = down_blocks_1_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_109_cast_fp16)[name = tensor("op_2186_cast_fp16")]; tensor var_2187_split_sizes_0 = const()[name = tensor("op_2187_split_sizes_0"), val = tensor([2560, 2560])]; tensor var_2187_axis_0 = const()[name = tensor("op_2187_axis_0"), val = tensor(1)]; tensor var_2187_cast_fp16_0, tensor var_2187_cast_fp16_1 = split(axis = var_2187_axis_0, split_sizes = var_2187_split_sizes_0, x = var_2186_cast_fp16)[name = tensor("op_2187_cast_fp16")]; tensor var_2189_mode_0 = const()[name = tensor("op_2189_mode_0"), val = tensor("EXACT")]; tensor var_2189_cast_fp16 = gelu(mode = var_2189_mode_0, x = var_2187_cast_fp16_1)[name = tensor("op_2189_cast_fp16")]; tensor input_111_cast_fp16 = mul(x = var_2187_cast_fp16_0, y = var_2189_cast_fp16)[name = tensor("input_111_cast_fp16")]; tensor var_2193 = const()[name = tensor("op_2193"), val = tensor([1, 1])]; tensor var_2195 = const()[name = tensor("op_2195"), val = tensor([1, 1])]; tensor var_2197_pad_type_0 = const()[name = tensor("op_2197_pad_type_0"), val = tensor("custom")]; tensor var_2197_pad_0 = const()[name = tensor("op_2197_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89318464)))]; tensor down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92595328)))]; tensor var_2197_cast_fp16 = conv(bias = down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_2195, groups = var_984, pad = var_2197_pad_0, pad_type = var_2197_pad_type_0, strides = var_2193, weight = down_blocks_1_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_111_cast_fp16)[name = tensor("op_2197_cast_fp16")]; tensor hidden_states_69_cast_fp16 = add(x = var_2197_cast_fp16, y = inputs_23_cast_fp16)[name = tensor("hidden_states_69_cast_fp16")]; tensor var_2199 = const()[name = tensor("op_2199"), val = tensor([2, 640, 24, 24])]; tensor input_113_cast_fp16 = reshape(shape = var_2199, x = hidden_states_69_cast_fp16)[name = tensor("input_113_cast_fp16")]; tensor var_2203 = const()[name = tensor("op_2203"), val = tensor([1, 1])]; tensor var_2205 = const()[name = tensor("op_2205"), val = tensor([1, 1])]; tensor hidden_states_71_pad_type_0 = const()[name = tensor("hidden_states_71_pad_type_0"), val = tensor("custom")]; tensor hidden_states_71_pad_0 = const()[name = tensor("hidden_states_71_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_1_attentions_1_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(92596672)))]; tensor down_blocks_1_attentions_1_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_1_attentions_1_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93415936)))]; tensor hidden_states_71_cast_fp16 = conv(bias = down_blocks_1_attentions_1_proj_out_bias_to_fp16, dilations = var_2205, groups = var_984, pad = hidden_states_71_pad_0, pad_type = hidden_states_71_pad_type_0, strides = var_2203, weight = down_blocks_1_attentions_1_proj_out_weight_to_fp16, x = input_113_cast_fp16)[name = tensor("hidden_states_71_cast_fp16")]; tensor input_115_cast_fp16_1 = add(x = hidden_states_71_cast_fp16, y = hidden_states_59_cast_fp16)[name = tensor("input_115_cast_fp16")]; tensor var_2212 = const()[name = tensor("op_2212"), val = tensor([2, 2])]; tensor var_2214 = const()[name = tensor("op_2214"), val = tensor([1, 1])]; tensor input_117_pad_type_0 = const()[name = tensor("input_117_pad_type_0"), val = tensor("custom")]; tensor input_117_pad_0 = const()[name = tensor("input_117_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_1_downsamplers_0_conv_weight_to_fp16 = const()[name = tensor("down_blocks_1_downsamplers_0_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93417280)))]; tensor down_blocks_1_downsamplers_0_conv_bias_to_fp16 = const()[name = tensor("down_blocks_1_downsamplers_0_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100790144)))]; tensor input_117_cast_fp16_1 = conv(bias = down_blocks_1_downsamplers_0_conv_bias_to_fp16, dilations = var_2214, groups = var_984, pad = input_117_pad_0, pad_type = input_117_pad_type_0, strides = var_2212, weight = down_blocks_1_downsamplers_0_conv_weight_to_fp16, x = input_115_cast_fp16_1)[name = tensor("input_117_cast_fp16")]; tensor var_2249 = const()[name = tensor("op_2249"), val = tensor(true)]; tensor var_2254 = const()[name = tensor("op_2254"), val = tensor(1)]; tensor reshape_48_shape_0 = const()[name = tensor("reshape_48_shape_0"), val = tensor([2, 32, 20, 12, 12])]; tensor reshape_48_cast_fp16 = reshape(shape = reshape_48_shape_0, x = input_117_cast_fp16_1)[name = tensor("reshape_48_cast_fp16")]; tensor reduce_mean_36_axes_0 = const()[name = tensor("reduce_mean_36_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_36_keep_dims_0 = const()[name = tensor("reduce_mean_36_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_36_cast_fp16 = reduce_mean(axes = reduce_mean_36_axes_0, keep_dims = reduce_mean_36_keep_dims_0, x = reshape_48_cast_fp16)[name = tensor("reduce_mean_36_cast_fp16")]; tensor sub_24_cast_fp16 = sub(x = reshape_48_cast_fp16, y = reduce_mean_36_cast_fp16)[name = tensor("sub_24_cast_fp16")]; tensor square_12_cast_fp16 = square(x = sub_24_cast_fp16)[name = tensor("square_12_cast_fp16")]; tensor reduce_mean_38_axes_0 = const()[name = tensor("reduce_mean_38_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_38_keep_dims_0 = const()[name = tensor("reduce_mean_38_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_38_cast_fp16 = reduce_mean(axes = reduce_mean_38_axes_0, keep_dims = reduce_mean_38_keep_dims_0, x = square_12_cast_fp16)[name = tensor("reduce_mean_38_cast_fp16")]; tensor add_24_y_0_to_fp16 = const()[name = tensor("add_24_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_24_cast_fp16 = add(x = reduce_mean_38_cast_fp16, y = add_24_y_0_to_fp16)[name = tensor("add_24_cast_fp16")]; tensor sqrt_12_cast_fp16 = sqrt(x = add_24_cast_fp16)[name = tensor("sqrt_12_cast_fp16")]; tensor real_div_12_cast_fp16 = real_div(x = sub_24_cast_fp16, y = sqrt_12_cast_fp16)[name = tensor("real_div_12_cast_fp16")]; tensor reshape_49_shape_0 = const()[name = tensor("reshape_49_shape_0"), val = tensor([2, 640, 12, 12])]; tensor reshape_49_cast_fp16 = reshape(shape = reshape_49_shape_0, x = real_div_12_cast_fp16)[name = tensor("reshape_49_cast_fp16")]; tensor add_25_gamma_0_to_fp16 = const()[name = tensor("add_25_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100791488)))]; tensor add_25_beta_0_to_fp16 = const()[name = tensor("add_25_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100792832)))]; tensor add_25_epsilon_0_to_fp16 = const()[name = tensor("add_25_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_25_cast_fp16 = batch_norm(beta = add_25_beta_0_to_fp16, epsilon = add_25_epsilon_0_to_fp16, gamma = add_25_gamma_0_to_fp16, mean = add_15_mean_0_to_fp16, variance = add_15_variance_0_to_fp16, x = reshape_49_cast_fp16)[name = tensor("add_25_cast_fp16")]; tensor input_121_cast_fp16 = silu(x = add_25_cast_fp16)[name = tensor("input_121_cast_fp16")]; tensor var_2277 = const()[name = tensor("op_2277"), val = tensor([1, 1])]; tensor var_2279 = const()[name = tensor("op_2279"), val = tensor([1, 1])]; tensor hidden_states_73_pad_type_0 = const()[name = tensor("hidden_states_73_pad_type_0"), val = tensor("custom")]; tensor hidden_states_73_pad_0 = const()[name = tensor("hidden_states_73_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_2_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100794176)))]; tensor down_blocks_2_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(115539840)))]; tensor hidden_states_73_cast_fp16 = conv(bias = down_blocks_2_resnets_0_conv1_bias_to_fp16, dilations = var_2279, groups = var_2254, pad = hidden_states_73_pad_0, pad_type = hidden_states_73_pad_type_0, strides = var_2277, weight = down_blocks_2_resnets_0_conv1_weight_to_fp16, x = input_121_cast_fp16)[name = tensor("hidden_states_73_cast_fp16")]; tensor var_2285 = const()[name = tensor("op_2285"), val = tensor([1, 1])]; tensor var_2287 = const()[name = tensor("op_2287"), val = tensor([1, 1])]; tensor temb_9_pad_type_0 = const()[name = tensor("temb_9_pad_type_0"), val = tensor("custom")]; tensor temb_9_pad_0 = const()[name = tensor("temb_9_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(115542464)))]; tensor down_blocks_2_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118819328)))]; tensor temb_9_cast_fp16 = conv(bias = down_blocks_2_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_2287, groups = var_2254, pad = temb_9_pad_0, pad_type = temb_9_pad_type_0, strides = var_2285, weight = down_blocks_2_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_9_cast_fp16")]; tensor input_125_cast_fp16 = add(x = hidden_states_73_cast_fp16, y = temb_9_cast_fp16)[name = tensor("input_125_cast_fp16")]; tensor reshape_52_shape_0 = const()[name = tensor("reshape_52_shape_0"), val = tensor([2, 32, 40, 12, 12])]; tensor reshape_52_cast_fp16 = reshape(shape = reshape_52_shape_0, x = input_125_cast_fp16)[name = tensor("reshape_52_cast_fp16")]; tensor reduce_mean_39_axes_0 = const()[name = tensor("reduce_mean_39_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_39_keep_dims_0 = const()[name = tensor("reduce_mean_39_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_39_cast_fp16 = reduce_mean(axes = reduce_mean_39_axes_0, keep_dims = reduce_mean_39_keep_dims_0, x = reshape_52_cast_fp16)[name = tensor("reduce_mean_39_cast_fp16")]; tensor sub_26_cast_fp16 = sub(x = reshape_52_cast_fp16, y = reduce_mean_39_cast_fp16)[name = tensor("sub_26_cast_fp16")]; tensor square_13_cast_fp16 = square(x = sub_26_cast_fp16)[name = tensor("square_13_cast_fp16")]; tensor reduce_mean_41_axes_0 = const()[name = tensor("reduce_mean_41_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_41_keep_dims_0 = const()[name = tensor("reduce_mean_41_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_41_cast_fp16 = reduce_mean(axes = reduce_mean_41_axes_0, keep_dims = reduce_mean_41_keep_dims_0, x = square_13_cast_fp16)[name = tensor("reduce_mean_41_cast_fp16")]; tensor add_26_y_0_to_fp16 = const()[name = tensor("add_26_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_26_cast_fp16 = add(x = reduce_mean_41_cast_fp16, y = add_26_y_0_to_fp16)[name = tensor("add_26_cast_fp16")]; tensor sqrt_13_cast_fp16 = sqrt(x = add_26_cast_fp16)[name = tensor("sqrt_13_cast_fp16")]; tensor real_div_13_cast_fp16 = real_div(x = sub_26_cast_fp16, y = sqrt_13_cast_fp16)[name = tensor("real_div_13_cast_fp16")]; tensor reshape_53_shape_0 = const()[name = tensor("reshape_53_shape_0"), val = tensor([2, 1280, 12, 12])]; tensor reshape_53_cast_fp16 = reshape(shape = reshape_53_shape_0, x = real_div_13_cast_fp16)[name = tensor("reshape_53_cast_fp16")]; tensor add_27_mean_0_to_fp16 = const()[name = tensor("add_27_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118821952)))]; tensor add_27_variance_0_to_fp16 = const()[name = tensor("add_27_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118824576)))]; tensor add_27_gamma_0_to_fp16 = const()[name = tensor("add_27_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118827200)))]; tensor add_27_beta_0_to_fp16 = const()[name = tensor("add_27_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118829824)))]; tensor add_27_epsilon_0_to_fp16 = const()[name = tensor("add_27_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_27_cast_fp16 = batch_norm(beta = add_27_beta_0_to_fp16, epsilon = add_27_epsilon_0_to_fp16, gamma = add_27_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_53_cast_fp16)[name = tensor("add_27_cast_fp16")]; tensor input_129_cast_fp16 = silu(x = add_27_cast_fp16)[name = tensor("input_129_cast_fp16")]; tensor var_2297 = const()[name = tensor("op_2297"), val = tensor([1, 1])]; tensor var_2299 = const()[name = tensor("op_2299"), val = tensor([1, 1])]; tensor hidden_states_75_pad_type_0 = const()[name = tensor("hidden_states_75_pad_type_0"), val = tensor("custom")]; tensor hidden_states_75_pad_0 = const()[name = tensor("hidden_states_75_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_2_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(118832448)))]; tensor down_blocks_2_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148323712)))]; tensor hidden_states_75_cast_fp16 = conv(bias = down_blocks_2_resnets_0_conv2_bias_to_fp16, dilations = var_2299, groups = var_2254, pad = hidden_states_75_pad_0, pad_type = hidden_states_75_pad_type_0, strides = var_2297, weight = down_blocks_2_resnets_0_conv2_weight_to_fp16, x = input_129_cast_fp16)[name = tensor("hidden_states_75_cast_fp16")]; tensor var_2304 = const()[name = tensor("op_2304"), val = tensor([1, 1])]; tensor var_2306 = const()[name = tensor("op_2306"), val = tensor([1, 1])]; tensor x_3_pad_type_0 = const()[name = tensor("x_3_pad_type_0"), val = tensor("custom")]; tensor x_3_pad_0 = const()[name = tensor("x_3_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_resnets_0_conv_shortcut_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(148326336)))]; tensor down_blocks_2_resnets_0_conv_shortcut_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_0_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149964800)))]; tensor x_3_cast_fp16 = conv(bias = down_blocks_2_resnets_0_conv_shortcut_bias_to_fp16, dilations = var_2306, groups = var_2254, pad = x_3_pad_0, pad_type = x_3_pad_type_0, strides = var_2304, weight = down_blocks_2_resnets_0_conv_shortcut_weight_to_fp16, x = input_117_cast_fp16_1)[name = tensor("x_3_cast_fp16")]; tensor hidden_states_77_cast_fp16 = add(x = x_3_cast_fp16, y = hidden_states_75_cast_fp16)[name = tensor("hidden_states_77_cast_fp16")]; tensor reshape_56_shape_0 = const()[name = tensor("reshape_56_shape_0"), val = tensor([2, 32, 40, 12, 12])]; tensor reshape_56_cast_fp16 = reshape(shape = reshape_56_shape_0, x = hidden_states_77_cast_fp16)[name = tensor("reshape_56_cast_fp16")]; tensor reduce_mean_42_axes_0 = const()[name = tensor("reduce_mean_42_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_42_keep_dims_0 = const()[name = tensor("reduce_mean_42_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_42_cast_fp16 = reduce_mean(axes = reduce_mean_42_axes_0, keep_dims = reduce_mean_42_keep_dims_0, x = reshape_56_cast_fp16)[name = tensor("reduce_mean_42_cast_fp16")]; tensor sub_28_cast_fp16 = sub(x = reshape_56_cast_fp16, y = reduce_mean_42_cast_fp16)[name = tensor("sub_28_cast_fp16")]; tensor square_14_cast_fp16 = square(x = sub_28_cast_fp16)[name = tensor("square_14_cast_fp16")]; tensor reduce_mean_44_axes_0 = const()[name = tensor("reduce_mean_44_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_44_keep_dims_0 = const()[name = tensor("reduce_mean_44_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_44_cast_fp16 = reduce_mean(axes = reduce_mean_44_axes_0, keep_dims = reduce_mean_44_keep_dims_0, x = square_14_cast_fp16)[name = tensor("reduce_mean_44_cast_fp16")]; tensor add_28_y_0_to_fp16 = const()[name = tensor("add_28_y_0_to_fp16"), val = tensor(0x1.1p-20)]; tensor add_28_cast_fp16 = add(x = reduce_mean_44_cast_fp16, y = add_28_y_0_to_fp16)[name = tensor("add_28_cast_fp16")]; tensor sqrt_14_cast_fp16 = sqrt(x = add_28_cast_fp16)[name = tensor("sqrt_14_cast_fp16")]; tensor real_div_14_cast_fp16 = real_div(x = sub_28_cast_fp16, y = sqrt_14_cast_fp16)[name = tensor("real_div_14_cast_fp16")]; tensor reshape_57_shape_0 = const()[name = tensor("reshape_57_shape_0"), val = tensor([2, 1280, 12, 12])]; tensor reshape_57_cast_fp16 = reshape(shape = reshape_57_shape_0, x = real_div_14_cast_fp16)[name = tensor("reshape_57_cast_fp16")]; tensor add_29_gamma_0_to_fp16 = const()[name = tensor("add_29_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149967424)))]; tensor add_29_beta_0_to_fp16 = const()[name = tensor("add_29_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149970048)))]; tensor add_29_epsilon_0_to_fp16 = const()[name = tensor("add_29_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_29_cast_fp16 = batch_norm(beta = add_29_beta_0_to_fp16, epsilon = add_29_epsilon_0_to_fp16, gamma = add_29_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_57_cast_fp16)[name = tensor("add_29_cast_fp16")]; tensor var_2326 = const()[name = tensor("op_2326"), val = tensor([1, 1])]; tensor var_2328 = const()[name = tensor("op_2328"), val = tensor([1, 1])]; tensor hidden_states_79_pad_type_0 = const()[name = tensor("hidden_states_79_pad_type_0"), val = tensor("custom")]; tensor hidden_states_79_pad_0 = const()[name = tensor("hidden_states_79_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(149972672)))]; tensor down_blocks_2_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153249536)))]; tensor hidden_states_79_cast_fp16 = conv(bias = down_blocks_2_attentions_0_proj_in_bias_to_fp16, dilations = var_2328, groups = var_2254, pad = hidden_states_79_pad_0, pad_type = hidden_states_79_pad_type_0, strides = var_2326, weight = down_blocks_2_attentions_0_proj_in_weight_to_fp16, x = add_29_cast_fp16)[name = tensor("hidden_states_79_cast_fp16")]; tensor var_2333 = const()[name = tensor("op_2333"), val = tensor([2, 1280, 1, 144])]; tensor inputs_25_cast_fp16 = reshape(shape = var_2333, x = hidden_states_79_cast_fp16)[name = tensor("inputs_25_cast_fp16")]; tensor var_2343 = const()[name = tensor("op_2343"), val = tensor([1])]; tensor channels_mean_25_cast_fp16 = reduce_mean(axes = var_2343, keep_dims = var_2249, x = inputs_25_cast_fp16)[name = tensor("channels_mean_25_cast_fp16")]; tensor zero_mean_25_cast_fp16 = sub(x = inputs_25_cast_fp16, y = channels_mean_25_cast_fp16)[name = tensor("zero_mean_25_cast_fp16")]; tensor zero_mean_sq_25_cast_fp16 = mul(x = zero_mean_25_cast_fp16, y = zero_mean_25_cast_fp16)[name = tensor("zero_mean_sq_25_cast_fp16")]; tensor var_2347 = const()[name = tensor("op_2347"), val = tensor([1])]; tensor var_2348_cast_fp16 = reduce_mean(axes = var_2347, keep_dims = var_2249, x = zero_mean_sq_25_cast_fp16)[name = tensor("op_2348_cast_fp16")]; tensor var_2349_to_fp16 = const()[name = tensor("op_2349_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2350_cast_fp16 = add(x = var_2348_cast_fp16, y = var_2349_to_fp16)[name = tensor("op_2350_cast_fp16")]; tensor denom_25_epsilon_0_to_fp16 = const()[name = tensor("denom_25_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_25_cast_fp16 = rsqrt(epsilon = denom_25_epsilon_0_to_fp16, x = var_2350_cast_fp16)[name = tensor("denom_25_cast_fp16")]; tensor out_25_cast_fp16 = mul(x = zero_mean_25_cast_fp16, y = denom_25_cast_fp16)[name = tensor("out_25_cast_fp16")]; tensor var_2354_to_fp16 = const()[name = tensor("op_2354_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153252160)))]; tensor var_2355_cast_fp16 = add(x = out_25_cast_fp16, y = var_2354_to_fp16)[name = tensor("op_2355_cast_fp16")]; tensor var_2357_to_fp16 = const()[name = tensor("op_2357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153254784)))]; tensor hidden_states_81_cast_fp16 = mul(x = var_2355_cast_fp16, y = var_2357_to_fp16)[name = tensor("hidden_states_81_cast_fp16")]; tensor var_2364 = const()[name = tensor("op_2364"), val = tensor([1, 1])]; tensor var_2366 = const()[name = tensor("op_2366"), val = tensor([1, 1])]; tensor q_17_pad_type_0 = const()[name = tensor("q_17_pad_type_0"), val = tensor("custom")]; tensor q_17_pad_0 = const()[name = tensor("q_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(153257408)))]; tensor q_17_cast_fp16 = conv(dilations = var_2366, groups = var_2254, pad = q_17_pad_0, pad_type = q_17_pad_type_0, strides = var_2364, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_81_cast_fp16)[name = tensor("q_17_cast_fp16")]; tensor var_2370 = const()[name = tensor("op_2370"), val = tensor([1, 1])]; tensor var_2372 = const()[name = tensor("op_2372"), val = tensor([1, 1])]; tensor k_33_pad_type_0 = const()[name = tensor("k_33_pad_type_0"), val = tensor("custom")]; tensor k_33_pad_0 = const()[name = tensor("k_33_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(156534272)))]; tensor k_33_cast_fp16 = conv(dilations = var_2372, groups = var_2254, pad = k_33_pad_0, pad_type = k_33_pad_type_0, strides = var_2370, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_81_cast_fp16)[name = tensor("k_33_cast_fp16")]; tensor var_2376 = const()[name = tensor("op_2376"), val = tensor([1, 1])]; tensor var_2378 = const()[name = tensor("op_2378"), val = tensor([1, 1])]; tensor v_17_pad_type_0 = const()[name = tensor("v_17_pad_type_0"), val = tensor("custom")]; tensor v_17_pad_0 = const()[name = tensor("v_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(159811136)))]; tensor v_17_cast_fp16 = conv(dilations = var_2378, groups = var_2254, pad = v_17_pad_0, pad_type = v_17_pad_type_0, strides = var_2376, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_81_cast_fp16)[name = tensor("v_17_cast_fp16")]; tensor var_2382_begin_0 = const()[name = tensor("op_2382_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_2382_end_0 = const()[name = tensor("op_2382_end_0"), val = tensor([2, 64, 1, 144])]; tensor var_2382_end_mask_0 = const()[name = tensor("op_2382_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2382_cast_fp16 = slice_by_index(begin = var_2382_begin_0, end = var_2382_end_0, end_mask = var_2382_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2382_cast_fp16")]; tensor var_2386_begin_0 = const()[name = tensor("op_2386_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_2386_end_0 = const()[name = tensor("op_2386_end_0"), val = tensor([2, 128, 1, 144])]; tensor var_2386_end_mask_0 = const()[name = tensor("op_2386_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2386_cast_fp16 = slice_by_index(begin = var_2386_begin_0, end = var_2386_end_0, end_mask = var_2386_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2386_cast_fp16")]; tensor var_2390_begin_0 = const()[name = tensor("op_2390_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_2390_end_0 = const()[name = tensor("op_2390_end_0"), val = tensor([2, 192, 1, 144])]; tensor var_2390_end_mask_0 = const()[name = tensor("op_2390_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2390_cast_fp16 = slice_by_index(begin = var_2390_begin_0, end = var_2390_end_0, end_mask = var_2390_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2390_cast_fp16")]; tensor var_2394_begin_0 = const()[name = tensor("op_2394_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_2394_end_0 = const()[name = tensor("op_2394_end_0"), val = tensor([2, 256, 1, 144])]; tensor var_2394_end_mask_0 = const()[name = tensor("op_2394_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2394_cast_fp16 = slice_by_index(begin = var_2394_begin_0, end = var_2394_end_0, end_mask = var_2394_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2394_cast_fp16")]; tensor var_2398_begin_0 = const()[name = tensor("op_2398_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_2398_end_0 = const()[name = tensor("op_2398_end_0"), val = tensor([2, 320, 1, 144])]; tensor var_2398_end_mask_0 = const()[name = tensor("op_2398_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2398_cast_fp16 = slice_by_index(begin = var_2398_begin_0, end = var_2398_end_0, end_mask = var_2398_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2398_cast_fp16")]; tensor var_2402_begin_0 = const()[name = tensor("op_2402_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_2402_end_0 = const()[name = tensor("op_2402_end_0"), val = tensor([2, 384, 1, 144])]; tensor var_2402_end_mask_0 = const()[name = tensor("op_2402_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2402_cast_fp16 = slice_by_index(begin = var_2402_begin_0, end = var_2402_end_0, end_mask = var_2402_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2402_cast_fp16")]; tensor var_2406_begin_0 = const()[name = tensor("op_2406_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_2406_end_0 = const()[name = tensor("op_2406_end_0"), val = tensor([2, 448, 1, 144])]; tensor var_2406_end_mask_0 = const()[name = tensor("op_2406_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2406_cast_fp16 = slice_by_index(begin = var_2406_begin_0, end = var_2406_end_0, end_mask = var_2406_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2406_cast_fp16")]; tensor var_2410_begin_0 = const()[name = tensor("op_2410_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_2410_end_0 = const()[name = tensor("op_2410_end_0"), val = tensor([2, 512, 1, 144])]; tensor var_2410_end_mask_0 = const()[name = tensor("op_2410_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2410_cast_fp16 = slice_by_index(begin = var_2410_begin_0, end = var_2410_end_0, end_mask = var_2410_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2410_cast_fp16")]; tensor var_2414_begin_0 = const()[name = tensor("op_2414_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_2414_end_0 = const()[name = tensor("op_2414_end_0"), val = tensor([2, 576, 1, 144])]; tensor var_2414_end_mask_0 = const()[name = tensor("op_2414_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2414_cast_fp16 = slice_by_index(begin = var_2414_begin_0, end = var_2414_end_0, end_mask = var_2414_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2414_cast_fp16")]; tensor var_2418_begin_0 = const()[name = tensor("op_2418_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_2418_end_0 = const()[name = tensor("op_2418_end_0"), val = tensor([2, 640, 1, 144])]; tensor var_2418_end_mask_0 = const()[name = tensor("op_2418_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2418_cast_fp16 = slice_by_index(begin = var_2418_begin_0, end = var_2418_end_0, end_mask = var_2418_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2418_cast_fp16")]; tensor var_2422_begin_0 = const()[name = tensor("op_2422_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_2422_end_0 = const()[name = tensor("op_2422_end_0"), val = tensor([2, 704, 1, 144])]; tensor var_2422_end_mask_0 = const()[name = tensor("op_2422_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2422_cast_fp16 = slice_by_index(begin = var_2422_begin_0, end = var_2422_end_0, end_mask = var_2422_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2422_cast_fp16")]; tensor var_2426_begin_0 = const()[name = tensor("op_2426_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_2426_end_0 = const()[name = tensor("op_2426_end_0"), val = tensor([2, 768, 1, 144])]; tensor var_2426_end_mask_0 = const()[name = tensor("op_2426_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2426_cast_fp16 = slice_by_index(begin = var_2426_begin_0, end = var_2426_end_0, end_mask = var_2426_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2426_cast_fp16")]; tensor var_2430_begin_0 = const()[name = tensor("op_2430_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_2430_end_0 = const()[name = tensor("op_2430_end_0"), val = tensor([2, 832, 1, 144])]; tensor var_2430_end_mask_0 = const()[name = tensor("op_2430_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2430_cast_fp16 = slice_by_index(begin = var_2430_begin_0, end = var_2430_end_0, end_mask = var_2430_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2430_cast_fp16")]; tensor var_2434_begin_0 = const()[name = tensor("op_2434_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_2434_end_0 = const()[name = tensor("op_2434_end_0"), val = tensor([2, 896, 1, 144])]; tensor var_2434_end_mask_0 = const()[name = tensor("op_2434_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2434_cast_fp16 = slice_by_index(begin = var_2434_begin_0, end = var_2434_end_0, end_mask = var_2434_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2434_cast_fp16")]; tensor var_2438_begin_0 = const()[name = tensor("op_2438_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_2438_end_0 = const()[name = tensor("op_2438_end_0"), val = tensor([2, 960, 1, 144])]; tensor var_2438_end_mask_0 = const()[name = tensor("op_2438_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2438_cast_fp16 = slice_by_index(begin = var_2438_begin_0, end = var_2438_end_0, end_mask = var_2438_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2438_cast_fp16")]; tensor var_2442_begin_0 = const()[name = tensor("op_2442_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_2442_end_0 = const()[name = tensor("op_2442_end_0"), val = tensor([2, 1024, 1, 144])]; tensor var_2442_end_mask_0 = const()[name = tensor("op_2442_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2442_cast_fp16 = slice_by_index(begin = var_2442_begin_0, end = var_2442_end_0, end_mask = var_2442_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2442_cast_fp16")]; tensor var_2446_begin_0 = const()[name = tensor("op_2446_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_2446_end_0 = const()[name = tensor("op_2446_end_0"), val = tensor([2, 1088, 1, 144])]; tensor var_2446_end_mask_0 = const()[name = tensor("op_2446_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2446_cast_fp16 = slice_by_index(begin = var_2446_begin_0, end = var_2446_end_0, end_mask = var_2446_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2446_cast_fp16")]; tensor var_2450_begin_0 = const()[name = tensor("op_2450_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_2450_end_0 = const()[name = tensor("op_2450_end_0"), val = tensor([2, 1152, 1, 144])]; tensor var_2450_end_mask_0 = const()[name = tensor("op_2450_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2450_cast_fp16 = slice_by_index(begin = var_2450_begin_0, end = var_2450_end_0, end_mask = var_2450_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2450_cast_fp16")]; tensor var_2454_begin_0 = const()[name = tensor("op_2454_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_2454_end_0 = const()[name = tensor("op_2454_end_0"), val = tensor([2, 1216, 1, 144])]; tensor var_2454_end_mask_0 = const()[name = tensor("op_2454_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2454_cast_fp16 = slice_by_index(begin = var_2454_begin_0, end = var_2454_end_0, end_mask = var_2454_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2454_cast_fp16")]; tensor var_2458_begin_0 = const()[name = tensor("op_2458_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_2458_end_0 = const()[name = tensor("op_2458_end_0"), val = tensor([2, 1280, 1, 144])]; tensor var_2458_end_mask_0 = const()[name = tensor("op_2458_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2458_cast_fp16 = slice_by_index(begin = var_2458_begin_0, end = var_2458_end_0, end_mask = var_2458_end_mask_0, x = q_17_cast_fp16)[name = tensor("op_2458_cast_fp16")]; tensor k_35_perm_0 = const()[name = tensor("k_35_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_2465_begin_0 = const()[name = tensor("op_2465_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_2465_end_0 = const()[name = tensor("op_2465_end_0"), val = tensor([2, 144, 1, 64])]; tensor var_2465_end_mask_0 = const()[name = tensor("op_2465_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_5 = transpose(perm = k_35_perm_0, x = k_33_cast_fp16)[name = tensor("transpose_5")]; tensor var_2465_cast_fp16 = slice_by_index(begin = var_2465_begin_0, end = var_2465_end_0, end_mask = var_2465_end_mask_0, x = transpose_5)[name = tensor("op_2465_cast_fp16")]; tensor var_2469_begin_0 = const()[name = tensor("op_2469_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_2469_end_0 = const()[name = tensor("op_2469_end_0"), val = tensor([2, 144, 1, 128])]; tensor var_2469_end_mask_0 = const()[name = tensor("op_2469_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2469_cast_fp16 = slice_by_index(begin = var_2469_begin_0, end = var_2469_end_0, end_mask = var_2469_end_mask_0, x = transpose_5)[name = tensor("op_2469_cast_fp16")]; tensor var_2473_begin_0 = const()[name = tensor("op_2473_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_2473_end_0 = const()[name = tensor("op_2473_end_0"), val = tensor([2, 144, 1, 192])]; tensor var_2473_end_mask_0 = const()[name = tensor("op_2473_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2473_cast_fp16 = slice_by_index(begin = var_2473_begin_0, end = var_2473_end_0, end_mask = var_2473_end_mask_0, x = transpose_5)[name = tensor("op_2473_cast_fp16")]; tensor var_2477_begin_0 = const()[name = tensor("op_2477_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_2477_end_0 = const()[name = tensor("op_2477_end_0"), val = tensor([2, 144, 1, 256])]; tensor var_2477_end_mask_0 = const()[name = tensor("op_2477_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2477_cast_fp16 = slice_by_index(begin = var_2477_begin_0, end = var_2477_end_0, end_mask = var_2477_end_mask_0, x = transpose_5)[name = tensor("op_2477_cast_fp16")]; tensor var_2481_begin_0 = const()[name = tensor("op_2481_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_2481_end_0 = const()[name = tensor("op_2481_end_0"), val = tensor([2, 144, 1, 320])]; tensor var_2481_end_mask_0 = const()[name = tensor("op_2481_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2481_cast_fp16 = slice_by_index(begin = var_2481_begin_0, end = var_2481_end_0, end_mask = var_2481_end_mask_0, x = transpose_5)[name = tensor("op_2481_cast_fp16")]; tensor var_2485_begin_0 = const()[name = tensor("op_2485_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_2485_end_0 = const()[name = tensor("op_2485_end_0"), val = tensor([2, 144, 1, 384])]; tensor var_2485_end_mask_0 = const()[name = tensor("op_2485_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2485_cast_fp16 = slice_by_index(begin = var_2485_begin_0, end = var_2485_end_0, end_mask = var_2485_end_mask_0, x = transpose_5)[name = tensor("op_2485_cast_fp16")]; tensor var_2489_begin_0 = const()[name = tensor("op_2489_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_2489_end_0 = const()[name = tensor("op_2489_end_0"), val = tensor([2, 144, 1, 448])]; tensor var_2489_end_mask_0 = const()[name = tensor("op_2489_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2489_cast_fp16 = slice_by_index(begin = var_2489_begin_0, end = var_2489_end_0, end_mask = var_2489_end_mask_0, x = transpose_5)[name = tensor("op_2489_cast_fp16")]; tensor var_2493_begin_0 = const()[name = tensor("op_2493_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_2493_end_0 = const()[name = tensor("op_2493_end_0"), val = tensor([2, 144, 1, 512])]; tensor var_2493_end_mask_0 = const()[name = tensor("op_2493_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2493_cast_fp16 = slice_by_index(begin = var_2493_begin_0, end = var_2493_end_0, end_mask = var_2493_end_mask_0, x = transpose_5)[name = tensor("op_2493_cast_fp16")]; tensor var_2497_begin_0 = const()[name = tensor("op_2497_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_2497_end_0 = const()[name = tensor("op_2497_end_0"), val = tensor([2, 144, 1, 576])]; tensor var_2497_end_mask_0 = const()[name = tensor("op_2497_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2497_cast_fp16 = slice_by_index(begin = var_2497_begin_0, end = var_2497_end_0, end_mask = var_2497_end_mask_0, x = transpose_5)[name = tensor("op_2497_cast_fp16")]; tensor var_2501_begin_0 = const()[name = tensor("op_2501_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_2501_end_0 = const()[name = tensor("op_2501_end_0"), val = tensor([2, 144, 1, 640])]; tensor var_2501_end_mask_0 = const()[name = tensor("op_2501_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2501_cast_fp16 = slice_by_index(begin = var_2501_begin_0, end = var_2501_end_0, end_mask = var_2501_end_mask_0, x = transpose_5)[name = tensor("op_2501_cast_fp16")]; tensor var_2505_begin_0 = const()[name = tensor("op_2505_begin_0"), val = tensor([0, 0, 0, 640])]; tensor var_2505_end_0 = const()[name = tensor("op_2505_end_0"), val = tensor([2, 144, 1, 704])]; tensor var_2505_end_mask_0 = const()[name = tensor("op_2505_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2505_cast_fp16 = slice_by_index(begin = var_2505_begin_0, end = var_2505_end_0, end_mask = var_2505_end_mask_0, x = transpose_5)[name = tensor("op_2505_cast_fp16")]; tensor var_2509_begin_0 = const()[name = tensor("op_2509_begin_0"), val = tensor([0, 0, 0, 704])]; tensor var_2509_end_0 = const()[name = tensor("op_2509_end_0"), val = tensor([2, 144, 1, 768])]; tensor var_2509_end_mask_0 = const()[name = tensor("op_2509_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2509_cast_fp16 = slice_by_index(begin = var_2509_begin_0, end = var_2509_end_0, end_mask = var_2509_end_mask_0, x = transpose_5)[name = tensor("op_2509_cast_fp16")]; tensor var_2513_begin_0 = const()[name = tensor("op_2513_begin_0"), val = tensor([0, 0, 0, 768])]; tensor var_2513_end_0 = const()[name = tensor("op_2513_end_0"), val = tensor([2, 144, 1, 832])]; tensor var_2513_end_mask_0 = const()[name = tensor("op_2513_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2513_cast_fp16 = slice_by_index(begin = var_2513_begin_0, end = var_2513_end_0, end_mask = var_2513_end_mask_0, x = transpose_5)[name = tensor("op_2513_cast_fp16")]; tensor var_2517_begin_0 = const()[name = tensor("op_2517_begin_0"), val = tensor([0, 0, 0, 832])]; tensor var_2517_end_0 = const()[name = tensor("op_2517_end_0"), val = tensor([2, 144, 1, 896])]; tensor var_2517_end_mask_0 = const()[name = tensor("op_2517_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2517_cast_fp16 = slice_by_index(begin = var_2517_begin_0, end = var_2517_end_0, end_mask = var_2517_end_mask_0, x = transpose_5)[name = tensor("op_2517_cast_fp16")]; tensor var_2521_begin_0 = const()[name = tensor("op_2521_begin_0"), val = tensor([0, 0, 0, 896])]; tensor var_2521_end_0 = const()[name = tensor("op_2521_end_0"), val = tensor([2, 144, 1, 960])]; tensor var_2521_end_mask_0 = const()[name = tensor("op_2521_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2521_cast_fp16 = slice_by_index(begin = var_2521_begin_0, end = var_2521_end_0, end_mask = var_2521_end_mask_0, x = transpose_5)[name = tensor("op_2521_cast_fp16")]; tensor var_2525_begin_0 = const()[name = tensor("op_2525_begin_0"), val = tensor([0, 0, 0, 960])]; tensor var_2525_end_0 = const()[name = tensor("op_2525_end_0"), val = tensor([2, 144, 1, 1024])]; tensor var_2525_end_mask_0 = const()[name = tensor("op_2525_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2525_cast_fp16 = slice_by_index(begin = var_2525_begin_0, end = var_2525_end_0, end_mask = var_2525_end_mask_0, x = transpose_5)[name = tensor("op_2525_cast_fp16")]; tensor var_2529_begin_0 = const()[name = tensor("op_2529_begin_0"), val = tensor([0, 0, 0, 1024])]; tensor var_2529_end_0 = const()[name = tensor("op_2529_end_0"), val = tensor([2, 144, 1, 1088])]; tensor var_2529_end_mask_0 = const()[name = tensor("op_2529_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2529_cast_fp16 = slice_by_index(begin = var_2529_begin_0, end = var_2529_end_0, end_mask = var_2529_end_mask_0, x = transpose_5)[name = tensor("op_2529_cast_fp16")]; tensor var_2533_begin_0 = const()[name = tensor("op_2533_begin_0"), val = tensor([0, 0, 0, 1088])]; tensor var_2533_end_0 = const()[name = tensor("op_2533_end_0"), val = tensor([2, 144, 1, 1152])]; tensor var_2533_end_mask_0 = const()[name = tensor("op_2533_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2533_cast_fp16 = slice_by_index(begin = var_2533_begin_0, end = var_2533_end_0, end_mask = var_2533_end_mask_0, x = transpose_5)[name = tensor("op_2533_cast_fp16")]; tensor var_2537_begin_0 = const()[name = tensor("op_2537_begin_0"), val = tensor([0, 0, 0, 1152])]; tensor var_2537_end_0 = const()[name = tensor("op_2537_end_0"), val = tensor([2, 144, 1, 1216])]; tensor var_2537_end_mask_0 = const()[name = tensor("op_2537_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2537_cast_fp16 = slice_by_index(begin = var_2537_begin_0, end = var_2537_end_0, end_mask = var_2537_end_mask_0, x = transpose_5)[name = tensor("op_2537_cast_fp16")]; tensor var_2541_begin_0 = const()[name = tensor("op_2541_begin_0"), val = tensor([0, 0, 0, 1216])]; tensor var_2541_end_0 = const()[name = tensor("op_2541_end_0"), val = tensor([2, 144, 1, 1280])]; tensor var_2541_end_mask_0 = const()[name = tensor("op_2541_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2541_cast_fp16 = slice_by_index(begin = var_2541_begin_0, end = var_2541_end_0, end_mask = var_2541_end_mask_0, x = transpose_5)[name = tensor("op_2541_cast_fp16")]; tensor var_2543_begin_0 = const()[name = tensor("op_2543_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_2543_end_0 = const()[name = tensor("op_2543_end_0"), val = tensor([2, 64, 1, 144])]; tensor var_2543_end_mask_0 = const()[name = tensor("op_2543_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2543_cast_fp16 = slice_by_index(begin = var_2543_begin_0, end = var_2543_end_0, end_mask = var_2543_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2543_cast_fp16")]; tensor var_2547_begin_0 = const()[name = tensor("op_2547_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_2547_end_0 = const()[name = tensor("op_2547_end_0"), val = tensor([2, 128, 1, 144])]; tensor var_2547_end_mask_0 = const()[name = tensor("op_2547_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2547_cast_fp16 = slice_by_index(begin = var_2547_begin_0, end = var_2547_end_0, end_mask = var_2547_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2547_cast_fp16")]; tensor var_2551_begin_0 = const()[name = tensor("op_2551_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_2551_end_0 = const()[name = tensor("op_2551_end_0"), val = tensor([2, 192, 1, 144])]; tensor var_2551_end_mask_0 = const()[name = tensor("op_2551_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2551_cast_fp16 = slice_by_index(begin = var_2551_begin_0, end = var_2551_end_0, end_mask = var_2551_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2551_cast_fp16")]; tensor var_2555_begin_0 = const()[name = tensor("op_2555_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_2555_end_0 = const()[name = tensor("op_2555_end_0"), val = tensor([2, 256, 1, 144])]; tensor var_2555_end_mask_0 = const()[name = tensor("op_2555_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2555_cast_fp16 = slice_by_index(begin = var_2555_begin_0, end = var_2555_end_0, end_mask = var_2555_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2555_cast_fp16")]; tensor var_2559_begin_0 = const()[name = tensor("op_2559_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_2559_end_0 = const()[name = tensor("op_2559_end_0"), val = tensor([2, 320, 1, 144])]; tensor var_2559_end_mask_0 = const()[name = tensor("op_2559_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2559_cast_fp16 = slice_by_index(begin = var_2559_begin_0, end = var_2559_end_0, end_mask = var_2559_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2559_cast_fp16")]; tensor var_2563_begin_0 = const()[name = tensor("op_2563_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_2563_end_0 = const()[name = tensor("op_2563_end_0"), val = tensor([2, 384, 1, 144])]; tensor var_2563_end_mask_0 = const()[name = tensor("op_2563_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2563_cast_fp16 = slice_by_index(begin = var_2563_begin_0, end = var_2563_end_0, end_mask = var_2563_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2563_cast_fp16")]; tensor var_2567_begin_0 = const()[name = tensor("op_2567_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_2567_end_0 = const()[name = tensor("op_2567_end_0"), val = tensor([2, 448, 1, 144])]; tensor var_2567_end_mask_0 = const()[name = tensor("op_2567_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2567_cast_fp16 = slice_by_index(begin = var_2567_begin_0, end = var_2567_end_0, end_mask = var_2567_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2567_cast_fp16")]; tensor var_2571_begin_0 = const()[name = tensor("op_2571_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_2571_end_0 = const()[name = tensor("op_2571_end_0"), val = tensor([2, 512, 1, 144])]; tensor var_2571_end_mask_0 = const()[name = tensor("op_2571_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2571_cast_fp16 = slice_by_index(begin = var_2571_begin_0, end = var_2571_end_0, end_mask = var_2571_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2571_cast_fp16")]; tensor var_2575_begin_0 = const()[name = tensor("op_2575_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_2575_end_0 = const()[name = tensor("op_2575_end_0"), val = tensor([2, 576, 1, 144])]; tensor var_2575_end_mask_0 = const()[name = tensor("op_2575_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2575_cast_fp16 = slice_by_index(begin = var_2575_begin_0, end = var_2575_end_0, end_mask = var_2575_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2575_cast_fp16")]; tensor var_2579_begin_0 = const()[name = tensor("op_2579_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_2579_end_0 = const()[name = tensor("op_2579_end_0"), val = tensor([2, 640, 1, 144])]; tensor var_2579_end_mask_0 = const()[name = tensor("op_2579_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2579_cast_fp16 = slice_by_index(begin = var_2579_begin_0, end = var_2579_end_0, end_mask = var_2579_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2579_cast_fp16")]; tensor var_2583_begin_0 = const()[name = tensor("op_2583_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_2583_end_0 = const()[name = tensor("op_2583_end_0"), val = tensor([2, 704, 1, 144])]; tensor var_2583_end_mask_0 = const()[name = tensor("op_2583_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2583_cast_fp16 = slice_by_index(begin = var_2583_begin_0, end = var_2583_end_0, end_mask = var_2583_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2583_cast_fp16")]; tensor var_2587_begin_0 = const()[name = tensor("op_2587_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_2587_end_0 = const()[name = tensor("op_2587_end_0"), val = tensor([2, 768, 1, 144])]; tensor var_2587_end_mask_0 = const()[name = tensor("op_2587_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2587_cast_fp16 = slice_by_index(begin = var_2587_begin_0, end = var_2587_end_0, end_mask = var_2587_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2587_cast_fp16")]; tensor var_2591_begin_0 = const()[name = tensor("op_2591_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_2591_end_0 = const()[name = tensor("op_2591_end_0"), val = tensor([2, 832, 1, 144])]; tensor var_2591_end_mask_0 = const()[name = tensor("op_2591_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2591_cast_fp16 = slice_by_index(begin = var_2591_begin_0, end = var_2591_end_0, end_mask = var_2591_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2591_cast_fp16")]; tensor var_2595_begin_0 = const()[name = tensor("op_2595_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_2595_end_0 = const()[name = tensor("op_2595_end_0"), val = tensor([2, 896, 1, 144])]; tensor var_2595_end_mask_0 = const()[name = tensor("op_2595_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2595_cast_fp16 = slice_by_index(begin = var_2595_begin_0, end = var_2595_end_0, end_mask = var_2595_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2595_cast_fp16")]; tensor var_2599_begin_0 = const()[name = tensor("op_2599_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_2599_end_0 = const()[name = tensor("op_2599_end_0"), val = tensor([2, 960, 1, 144])]; tensor var_2599_end_mask_0 = const()[name = tensor("op_2599_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2599_cast_fp16 = slice_by_index(begin = var_2599_begin_0, end = var_2599_end_0, end_mask = var_2599_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2599_cast_fp16")]; tensor var_2603_begin_0 = const()[name = tensor("op_2603_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_2603_end_0 = const()[name = tensor("op_2603_end_0"), val = tensor([2, 1024, 1, 144])]; tensor var_2603_end_mask_0 = const()[name = tensor("op_2603_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2603_cast_fp16 = slice_by_index(begin = var_2603_begin_0, end = var_2603_end_0, end_mask = var_2603_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2603_cast_fp16")]; tensor var_2607_begin_0 = const()[name = tensor("op_2607_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_2607_end_0 = const()[name = tensor("op_2607_end_0"), val = tensor([2, 1088, 1, 144])]; tensor var_2607_end_mask_0 = const()[name = tensor("op_2607_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2607_cast_fp16 = slice_by_index(begin = var_2607_begin_0, end = var_2607_end_0, end_mask = var_2607_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2607_cast_fp16")]; tensor var_2611_begin_0 = const()[name = tensor("op_2611_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_2611_end_0 = const()[name = tensor("op_2611_end_0"), val = tensor([2, 1152, 1, 144])]; tensor var_2611_end_mask_0 = const()[name = tensor("op_2611_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2611_cast_fp16 = slice_by_index(begin = var_2611_begin_0, end = var_2611_end_0, end_mask = var_2611_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2611_cast_fp16")]; tensor var_2615_begin_0 = const()[name = tensor("op_2615_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_2615_end_0 = const()[name = tensor("op_2615_end_0"), val = tensor([2, 1216, 1, 144])]; tensor var_2615_end_mask_0 = const()[name = tensor("op_2615_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2615_cast_fp16 = slice_by_index(begin = var_2615_begin_0, end = var_2615_end_0, end_mask = var_2615_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2615_cast_fp16")]; tensor var_2619_begin_0 = const()[name = tensor("op_2619_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_2619_end_0 = const()[name = tensor("op_2619_end_0"), val = tensor([2, 1280, 1, 144])]; tensor var_2619_end_mask_0 = const()[name = tensor("op_2619_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2619_cast_fp16 = slice_by_index(begin = var_2619_begin_0, end = var_2619_end_0, end_mask = var_2619_end_mask_0, x = v_17_cast_fp16)[name = tensor("op_2619_cast_fp16")]; tensor var_2623_equation_0 = const()[name = tensor("op_2623_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2623_cast_fp16 = einsum(equation = var_2623_equation_0, values = (var_2465_cast_fp16, var_2382_cast_fp16))[name = tensor("op_2623_cast_fp16")]; tensor var_2624_to_fp16 = const()[name = tensor("op_2624_to_fp16"), val = tensor(0x1p-3)]; tensor aw_121_cast_fp16 = mul(x = var_2623_cast_fp16, y = var_2624_to_fp16)[name = tensor("aw_121_cast_fp16")]; tensor var_2627_equation_0 = const()[name = tensor("op_2627_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2627_cast_fp16 = einsum(equation = var_2627_equation_0, values = (var_2469_cast_fp16, var_2386_cast_fp16))[name = tensor("op_2627_cast_fp16")]; tensor var_2628_to_fp16 = const()[name = tensor("op_2628_to_fp16"), val = tensor(0x1p-3)]; tensor aw_123_cast_fp16 = mul(x = var_2627_cast_fp16, y = var_2628_to_fp16)[name = tensor("aw_123_cast_fp16")]; tensor var_2631_equation_0 = const()[name = tensor("op_2631_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2631_cast_fp16 = einsum(equation = var_2631_equation_0, values = (var_2473_cast_fp16, var_2390_cast_fp16))[name = tensor("op_2631_cast_fp16")]; tensor var_2632_to_fp16 = const()[name = tensor("op_2632_to_fp16"), val = tensor(0x1p-3)]; tensor aw_125_cast_fp16 = mul(x = var_2631_cast_fp16, y = var_2632_to_fp16)[name = tensor("aw_125_cast_fp16")]; tensor var_2635_equation_0 = const()[name = tensor("op_2635_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2635_cast_fp16 = einsum(equation = var_2635_equation_0, values = (var_2477_cast_fp16, var_2394_cast_fp16))[name = tensor("op_2635_cast_fp16")]; tensor var_2636_to_fp16 = const()[name = tensor("op_2636_to_fp16"), val = tensor(0x1p-3)]; tensor aw_127_cast_fp16 = mul(x = var_2635_cast_fp16, y = var_2636_to_fp16)[name = tensor("aw_127_cast_fp16")]; tensor var_2639_equation_0 = const()[name = tensor("op_2639_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2639_cast_fp16 = einsum(equation = var_2639_equation_0, values = (var_2481_cast_fp16, var_2398_cast_fp16))[name = tensor("op_2639_cast_fp16")]; tensor var_2640_to_fp16 = const()[name = tensor("op_2640_to_fp16"), val = tensor(0x1p-3)]; tensor aw_129_cast_fp16 = mul(x = var_2639_cast_fp16, y = var_2640_to_fp16)[name = tensor("aw_129_cast_fp16")]; tensor var_2643_equation_0 = const()[name = tensor("op_2643_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2643_cast_fp16 = einsum(equation = var_2643_equation_0, values = (var_2485_cast_fp16, var_2402_cast_fp16))[name = tensor("op_2643_cast_fp16")]; tensor var_2644_to_fp16 = const()[name = tensor("op_2644_to_fp16"), val = tensor(0x1p-3)]; tensor aw_131_cast_fp16 = mul(x = var_2643_cast_fp16, y = var_2644_to_fp16)[name = tensor("aw_131_cast_fp16")]; tensor var_2647_equation_0 = const()[name = tensor("op_2647_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2647_cast_fp16 = einsum(equation = var_2647_equation_0, values = (var_2489_cast_fp16, var_2406_cast_fp16))[name = tensor("op_2647_cast_fp16")]; tensor var_2648_to_fp16 = const()[name = tensor("op_2648_to_fp16"), val = tensor(0x1p-3)]; tensor aw_133_cast_fp16 = mul(x = var_2647_cast_fp16, y = var_2648_to_fp16)[name = tensor("aw_133_cast_fp16")]; tensor var_2651_equation_0 = const()[name = tensor("op_2651_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2651_cast_fp16 = einsum(equation = var_2651_equation_0, values = (var_2493_cast_fp16, var_2410_cast_fp16))[name = tensor("op_2651_cast_fp16")]; tensor var_2652_to_fp16 = const()[name = tensor("op_2652_to_fp16"), val = tensor(0x1p-3)]; tensor aw_135_cast_fp16 = mul(x = var_2651_cast_fp16, y = var_2652_to_fp16)[name = tensor("aw_135_cast_fp16")]; tensor var_2655_equation_0 = const()[name = tensor("op_2655_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2655_cast_fp16 = einsum(equation = var_2655_equation_0, values = (var_2497_cast_fp16, var_2414_cast_fp16))[name = tensor("op_2655_cast_fp16")]; tensor var_2656_to_fp16 = const()[name = tensor("op_2656_to_fp16"), val = tensor(0x1p-3)]; tensor aw_137_cast_fp16 = mul(x = var_2655_cast_fp16, y = var_2656_to_fp16)[name = tensor("aw_137_cast_fp16")]; tensor var_2659_equation_0 = const()[name = tensor("op_2659_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2659_cast_fp16 = einsum(equation = var_2659_equation_0, values = (var_2501_cast_fp16, var_2418_cast_fp16))[name = tensor("op_2659_cast_fp16")]; tensor var_2660_to_fp16 = const()[name = tensor("op_2660_to_fp16"), val = tensor(0x1p-3)]; tensor aw_139_cast_fp16 = mul(x = var_2659_cast_fp16, y = var_2660_to_fp16)[name = tensor("aw_139_cast_fp16")]; tensor var_2663_equation_0 = const()[name = tensor("op_2663_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2663_cast_fp16 = einsum(equation = var_2663_equation_0, values = (var_2505_cast_fp16, var_2422_cast_fp16))[name = tensor("op_2663_cast_fp16")]; tensor var_2664_to_fp16 = const()[name = tensor("op_2664_to_fp16"), val = tensor(0x1p-3)]; tensor aw_141_cast_fp16 = mul(x = var_2663_cast_fp16, y = var_2664_to_fp16)[name = tensor("aw_141_cast_fp16")]; tensor var_2667_equation_0 = const()[name = tensor("op_2667_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2667_cast_fp16 = einsum(equation = var_2667_equation_0, values = (var_2509_cast_fp16, var_2426_cast_fp16))[name = tensor("op_2667_cast_fp16")]; tensor var_2668_to_fp16 = const()[name = tensor("op_2668_to_fp16"), val = tensor(0x1p-3)]; tensor aw_143_cast_fp16 = mul(x = var_2667_cast_fp16, y = var_2668_to_fp16)[name = tensor("aw_143_cast_fp16")]; tensor var_2671_equation_0 = const()[name = tensor("op_2671_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2671_cast_fp16 = einsum(equation = var_2671_equation_0, values = (var_2513_cast_fp16, var_2430_cast_fp16))[name = tensor("op_2671_cast_fp16")]; tensor var_2672_to_fp16 = const()[name = tensor("op_2672_to_fp16"), val = tensor(0x1p-3)]; tensor aw_145_cast_fp16 = mul(x = var_2671_cast_fp16, y = var_2672_to_fp16)[name = tensor("aw_145_cast_fp16")]; tensor var_2675_equation_0 = const()[name = tensor("op_2675_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2675_cast_fp16 = einsum(equation = var_2675_equation_0, values = (var_2517_cast_fp16, var_2434_cast_fp16))[name = tensor("op_2675_cast_fp16")]; tensor var_2676_to_fp16 = const()[name = tensor("op_2676_to_fp16"), val = tensor(0x1p-3)]; tensor aw_147_cast_fp16 = mul(x = var_2675_cast_fp16, y = var_2676_to_fp16)[name = tensor("aw_147_cast_fp16")]; tensor var_2679_equation_0 = const()[name = tensor("op_2679_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2679_cast_fp16 = einsum(equation = var_2679_equation_0, values = (var_2521_cast_fp16, var_2438_cast_fp16))[name = tensor("op_2679_cast_fp16")]; tensor var_2680_to_fp16 = const()[name = tensor("op_2680_to_fp16"), val = tensor(0x1p-3)]; tensor aw_149_cast_fp16 = mul(x = var_2679_cast_fp16, y = var_2680_to_fp16)[name = tensor("aw_149_cast_fp16")]; tensor var_2683_equation_0 = const()[name = tensor("op_2683_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2683_cast_fp16 = einsum(equation = var_2683_equation_0, values = (var_2525_cast_fp16, var_2442_cast_fp16))[name = tensor("op_2683_cast_fp16")]; tensor var_2684_to_fp16 = const()[name = tensor("op_2684_to_fp16"), val = tensor(0x1p-3)]; tensor aw_151_cast_fp16 = mul(x = var_2683_cast_fp16, y = var_2684_to_fp16)[name = tensor("aw_151_cast_fp16")]; tensor var_2687_equation_0 = const()[name = tensor("op_2687_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2687_cast_fp16 = einsum(equation = var_2687_equation_0, values = (var_2529_cast_fp16, var_2446_cast_fp16))[name = tensor("op_2687_cast_fp16")]; tensor var_2688_to_fp16 = const()[name = tensor("op_2688_to_fp16"), val = tensor(0x1p-3)]; tensor aw_153_cast_fp16 = mul(x = var_2687_cast_fp16, y = var_2688_to_fp16)[name = tensor("aw_153_cast_fp16")]; tensor var_2691_equation_0 = const()[name = tensor("op_2691_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2691_cast_fp16 = einsum(equation = var_2691_equation_0, values = (var_2533_cast_fp16, var_2450_cast_fp16))[name = tensor("op_2691_cast_fp16")]; tensor var_2692_to_fp16 = const()[name = tensor("op_2692_to_fp16"), val = tensor(0x1p-3)]; tensor aw_155_cast_fp16 = mul(x = var_2691_cast_fp16, y = var_2692_to_fp16)[name = tensor("aw_155_cast_fp16")]; tensor var_2695_equation_0 = const()[name = tensor("op_2695_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2695_cast_fp16 = einsum(equation = var_2695_equation_0, values = (var_2537_cast_fp16, var_2454_cast_fp16))[name = tensor("op_2695_cast_fp16")]; tensor var_2696_to_fp16 = const()[name = tensor("op_2696_to_fp16"), val = tensor(0x1p-3)]; tensor aw_157_cast_fp16 = mul(x = var_2695_cast_fp16, y = var_2696_to_fp16)[name = tensor("aw_157_cast_fp16")]; tensor var_2699_equation_0 = const()[name = tensor("op_2699_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_2699_cast_fp16 = einsum(equation = var_2699_equation_0, values = (var_2541_cast_fp16, var_2458_cast_fp16))[name = tensor("op_2699_cast_fp16")]; tensor var_2700_to_fp16 = const()[name = tensor("op_2700_to_fp16"), val = tensor(0x1p-3)]; tensor aw_159_cast_fp16 = mul(x = var_2699_cast_fp16, y = var_2700_to_fp16)[name = tensor("aw_159_cast_fp16")]; tensor var_2702_cast_fp16 = softmax(axis = var_2254, x = aw_121_cast_fp16)[name = tensor("op_2702_cast_fp16")]; tensor var_2703_cast_fp16 = softmax(axis = var_2254, x = aw_123_cast_fp16)[name = tensor("op_2703_cast_fp16")]; tensor var_2704_cast_fp16 = softmax(axis = var_2254, x = aw_125_cast_fp16)[name = tensor("op_2704_cast_fp16")]; tensor var_2705_cast_fp16 = softmax(axis = var_2254, x = aw_127_cast_fp16)[name = tensor("op_2705_cast_fp16")]; tensor var_2706_cast_fp16 = softmax(axis = var_2254, x = aw_129_cast_fp16)[name = tensor("op_2706_cast_fp16")]; tensor var_2707_cast_fp16 = softmax(axis = var_2254, x = aw_131_cast_fp16)[name = tensor("op_2707_cast_fp16")]; tensor var_2708_cast_fp16 = softmax(axis = var_2254, x = aw_133_cast_fp16)[name = tensor("op_2708_cast_fp16")]; tensor var_2709_cast_fp16 = softmax(axis = var_2254, x = aw_135_cast_fp16)[name = tensor("op_2709_cast_fp16")]; tensor var_2710_cast_fp16 = softmax(axis = var_2254, x = aw_137_cast_fp16)[name = tensor("op_2710_cast_fp16")]; tensor var_2711_cast_fp16 = softmax(axis = var_2254, x = aw_139_cast_fp16)[name = tensor("op_2711_cast_fp16")]; tensor var_2712_cast_fp16 = softmax(axis = var_2254, x = aw_141_cast_fp16)[name = tensor("op_2712_cast_fp16")]; tensor var_2713_cast_fp16 = softmax(axis = var_2254, x = aw_143_cast_fp16)[name = tensor("op_2713_cast_fp16")]; tensor var_2714_cast_fp16 = softmax(axis = var_2254, x = aw_145_cast_fp16)[name = tensor("op_2714_cast_fp16")]; tensor var_2715_cast_fp16 = softmax(axis = var_2254, x = aw_147_cast_fp16)[name = tensor("op_2715_cast_fp16")]; tensor var_2716_cast_fp16 = softmax(axis = var_2254, x = aw_149_cast_fp16)[name = tensor("op_2716_cast_fp16")]; tensor var_2717_cast_fp16 = softmax(axis = var_2254, x = aw_151_cast_fp16)[name = tensor("op_2717_cast_fp16")]; tensor var_2718_cast_fp16 = softmax(axis = var_2254, x = aw_153_cast_fp16)[name = tensor("op_2718_cast_fp16")]; tensor var_2719_cast_fp16 = softmax(axis = var_2254, x = aw_155_cast_fp16)[name = tensor("op_2719_cast_fp16")]; tensor var_2720_cast_fp16 = softmax(axis = var_2254, x = aw_157_cast_fp16)[name = tensor("op_2720_cast_fp16")]; tensor var_2721_cast_fp16 = softmax(axis = var_2254, x = aw_159_cast_fp16)[name = tensor("op_2721_cast_fp16")]; tensor var_2723_equation_0 = const()[name = tensor("op_2723_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2723_cast_fp16 = einsum(equation = var_2723_equation_0, values = (var_2543_cast_fp16, var_2702_cast_fp16))[name = tensor("op_2723_cast_fp16")]; tensor var_2725_equation_0 = const()[name = tensor("op_2725_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2725_cast_fp16 = einsum(equation = var_2725_equation_0, values = (var_2547_cast_fp16, var_2703_cast_fp16))[name = tensor("op_2725_cast_fp16")]; tensor var_2727_equation_0 = const()[name = tensor("op_2727_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2727_cast_fp16 = einsum(equation = var_2727_equation_0, values = (var_2551_cast_fp16, var_2704_cast_fp16))[name = tensor("op_2727_cast_fp16")]; tensor var_2729_equation_0 = const()[name = tensor("op_2729_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2729_cast_fp16 = einsum(equation = var_2729_equation_0, values = (var_2555_cast_fp16, var_2705_cast_fp16))[name = tensor("op_2729_cast_fp16")]; tensor var_2731_equation_0 = const()[name = tensor("op_2731_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2731_cast_fp16 = einsum(equation = var_2731_equation_0, values = (var_2559_cast_fp16, var_2706_cast_fp16))[name = tensor("op_2731_cast_fp16")]; tensor var_2733_equation_0 = const()[name = tensor("op_2733_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2733_cast_fp16 = einsum(equation = var_2733_equation_0, values = (var_2563_cast_fp16, var_2707_cast_fp16))[name = tensor("op_2733_cast_fp16")]; tensor var_2735_equation_0 = const()[name = tensor("op_2735_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2735_cast_fp16 = einsum(equation = var_2735_equation_0, values = (var_2567_cast_fp16, var_2708_cast_fp16))[name = tensor("op_2735_cast_fp16")]; tensor var_2737_equation_0 = const()[name = tensor("op_2737_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2737_cast_fp16 = einsum(equation = var_2737_equation_0, values = (var_2571_cast_fp16, var_2709_cast_fp16))[name = tensor("op_2737_cast_fp16")]; tensor var_2739_equation_0 = const()[name = tensor("op_2739_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2739_cast_fp16 = einsum(equation = var_2739_equation_0, values = (var_2575_cast_fp16, var_2710_cast_fp16))[name = tensor("op_2739_cast_fp16")]; tensor var_2741_equation_0 = const()[name = tensor("op_2741_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2741_cast_fp16 = einsum(equation = var_2741_equation_0, values = (var_2579_cast_fp16, var_2711_cast_fp16))[name = tensor("op_2741_cast_fp16")]; tensor var_2743_equation_0 = const()[name = tensor("op_2743_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2743_cast_fp16 = einsum(equation = var_2743_equation_0, values = (var_2583_cast_fp16, var_2712_cast_fp16))[name = tensor("op_2743_cast_fp16")]; tensor var_2745_equation_0 = const()[name = tensor("op_2745_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2745_cast_fp16 = einsum(equation = var_2745_equation_0, values = (var_2587_cast_fp16, var_2713_cast_fp16))[name = tensor("op_2745_cast_fp16")]; tensor var_2747_equation_0 = const()[name = tensor("op_2747_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2747_cast_fp16 = einsum(equation = var_2747_equation_0, values = (var_2591_cast_fp16, var_2714_cast_fp16))[name = tensor("op_2747_cast_fp16")]; tensor var_2749_equation_0 = const()[name = tensor("op_2749_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2749_cast_fp16 = einsum(equation = var_2749_equation_0, values = (var_2595_cast_fp16, var_2715_cast_fp16))[name = tensor("op_2749_cast_fp16")]; tensor var_2751_equation_0 = const()[name = tensor("op_2751_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2751_cast_fp16 = einsum(equation = var_2751_equation_0, values = (var_2599_cast_fp16, var_2716_cast_fp16))[name = tensor("op_2751_cast_fp16")]; tensor var_2753_equation_0 = const()[name = tensor("op_2753_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2753_cast_fp16 = einsum(equation = var_2753_equation_0, values = (var_2603_cast_fp16, var_2717_cast_fp16))[name = tensor("op_2753_cast_fp16")]; tensor var_2755_equation_0 = const()[name = tensor("op_2755_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2755_cast_fp16 = einsum(equation = var_2755_equation_0, values = (var_2607_cast_fp16, var_2718_cast_fp16))[name = tensor("op_2755_cast_fp16")]; tensor var_2757_equation_0 = const()[name = tensor("op_2757_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2757_cast_fp16 = einsum(equation = var_2757_equation_0, values = (var_2611_cast_fp16, var_2719_cast_fp16))[name = tensor("op_2757_cast_fp16")]; tensor var_2759_equation_0 = const()[name = tensor("op_2759_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2759_cast_fp16 = einsum(equation = var_2759_equation_0, values = (var_2615_cast_fp16, var_2720_cast_fp16))[name = tensor("op_2759_cast_fp16")]; tensor var_2761_equation_0 = const()[name = tensor("op_2761_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_2761_cast_fp16 = einsum(equation = var_2761_equation_0, values = (var_2619_cast_fp16, var_2721_cast_fp16))[name = tensor("op_2761_cast_fp16")]; tensor input_133_interleave_0 = const()[name = tensor("input_133_interleave_0"), val = tensor(false)]; tensor input_133_cast_fp16 = concat(axis = var_2254, interleave = input_133_interleave_0, values = (var_2723_cast_fp16, var_2725_cast_fp16, var_2727_cast_fp16, var_2729_cast_fp16, var_2731_cast_fp16, var_2733_cast_fp16, var_2735_cast_fp16, var_2737_cast_fp16, var_2739_cast_fp16, var_2741_cast_fp16, var_2743_cast_fp16, var_2745_cast_fp16, var_2747_cast_fp16, var_2749_cast_fp16, var_2751_cast_fp16, var_2753_cast_fp16, var_2755_cast_fp16, var_2757_cast_fp16, var_2759_cast_fp16, var_2761_cast_fp16))[name = tensor("input_133_cast_fp16")]; tensor var_2767 = const()[name = tensor("op_2767"), val = tensor([1, 1])]; tensor var_2769 = const()[name = tensor("op_2769"), val = tensor([1, 1])]; tensor var_2771_pad_type_0 = const()[name = tensor("op_2771_pad_type_0"), val = tensor("custom")]; tensor var_2771_pad_0 = const()[name = tensor("op_2771_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163088000)))]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166364864)))]; tensor var_2771_cast_fp16 = conv(bias = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_2769, groups = var_2254, pad = var_2771_pad_0, pad_type = var_2771_pad_type_0, strides = var_2767, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_133_cast_fp16)[name = tensor("op_2771_cast_fp16")]; tensor inputs_27_cast_fp16 = add(x = var_2771_cast_fp16, y = inputs_25_cast_fp16)[name = tensor("inputs_27_cast_fp16")]; tensor var_2775 = const()[name = tensor("op_2775"), val = tensor([1])]; tensor channels_mean_27_cast_fp16 = reduce_mean(axes = var_2775, keep_dims = var_2249, x = inputs_27_cast_fp16)[name = tensor("channels_mean_27_cast_fp16")]; tensor zero_mean_27_cast_fp16 = sub(x = inputs_27_cast_fp16, y = channels_mean_27_cast_fp16)[name = tensor("zero_mean_27_cast_fp16")]; tensor zero_mean_sq_27_cast_fp16 = mul(x = zero_mean_27_cast_fp16, y = zero_mean_27_cast_fp16)[name = tensor("zero_mean_sq_27_cast_fp16")]; tensor var_2779 = const()[name = tensor("op_2779"), val = tensor([1])]; tensor var_2780_cast_fp16 = reduce_mean(axes = var_2779, keep_dims = var_2249, x = zero_mean_sq_27_cast_fp16)[name = tensor("op_2780_cast_fp16")]; tensor var_2781_to_fp16 = const()[name = tensor("op_2781_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2782_cast_fp16 = add(x = var_2780_cast_fp16, y = var_2781_to_fp16)[name = tensor("op_2782_cast_fp16")]; tensor denom_27_epsilon_0_to_fp16 = const()[name = tensor("denom_27_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_27_cast_fp16 = rsqrt(epsilon = denom_27_epsilon_0_to_fp16, x = var_2782_cast_fp16)[name = tensor("denom_27_cast_fp16")]; tensor out_27_cast_fp16 = mul(x = zero_mean_27_cast_fp16, y = denom_27_cast_fp16)[name = tensor("out_27_cast_fp16")]; tensor var_2786_to_fp16 = const()[name = tensor("op_2786_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166367488)))]; tensor var_2787_cast_fp16 = add(x = out_27_cast_fp16, y = var_2786_to_fp16)[name = tensor("op_2787_cast_fp16")]; tensor var_2789_to_fp16 = const()[name = tensor("op_2789_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166370112)))]; tensor hidden_states_83_cast_fp16 = mul(x = var_2787_cast_fp16, y = var_2789_to_fp16)[name = tensor("hidden_states_83_cast_fp16")]; tensor var_2796 = const()[name = tensor("op_2796"), val = tensor([1, 1])]; tensor var_2798 = const()[name = tensor("op_2798"), val = tensor([1, 1])]; tensor q_19_pad_type_0 = const()[name = tensor("q_19_pad_type_0"), val = tensor("custom")]; tensor q_19_pad_0 = const()[name = tensor("q_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(166372736)))]; tensor q_19_cast_fp16 = conv(dilations = var_2798, groups = var_2254, pad = q_19_pad_0, pad_type = q_19_pad_type_0, strides = var_2796, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_83_cast_fp16)[name = tensor("q_19_cast_fp16")]; tensor var_2802 = const()[name = tensor("op_2802"), val = tensor([1, 1])]; tensor var_2804 = const()[name = tensor("op_2804"), val = tensor([1, 1])]; tensor k_37_pad_type_0 = const()[name = tensor("k_37_pad_type_0"), val = tensor("custom")]; tensor k_37_pad_0 = const()[name = tensor("k_37_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169649600)))]; tensor k_37_cast_fp16 = conv(dilations = var_2804, groups = var_2254, pad = k_37_pad_0, pad_type = k_37_pad_type_0, strides = var_2802, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_37_cast_fp16")]; tensor var_2808 = const()[name = tensor("op_2808"), val = tensor([1, 1])]; tensor var_2810 = const()[name = tensor("op_2810"), val = tensor([1, 1])]; tensor v_19_pad_type_0 = const()[name = tensor("v_19_pad_type_0"), val = tensor("custom")]; tensor v_19_pad_0 = const()[name = tensor("v_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(172271104)))]; tensor v_19_cast_fp16 = conv(dilations = var_2810, groups = var_2254, pad = v_19_pad_0, pad_type = v_19_pad_type_0, strides = var_2808, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_19_cast_fp16")]; tensor var_2814_begin_0 = const()[name = tensor("op_2814_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_2814_end_0 = const()[name = tensor("op_2814_end_0"), val = tensor([2, 64, 1, 144])]; tensor var_2814_end_mask_0 = const()[name = tensor("op_2814_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2814_cast_fp16 = slice_by_index(begin = var_2814_begin_0, end = var_2814_end_0, end_mask = var_2814_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2814_cast_fp16")]; tensor var_2818_begin_0 = const()[name = tensor("op_2818_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_2818_end_0 = const()[name = tensor("op_2818_end_0"), val = tensor([2, 128, 1, 144])]; tensor var_2818_end_mask_0 = const()[name = tensor("op_2818_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2818_cast_fp16 = slice_by_index(begin = var_2818_begin_0, end = var_2818_end_0, end_mask = var_2818_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2818_cast_fp16")]; tensor var_2822_begin_0 = const()[name = tensor("op_2822_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_2822_end_0 = const()[name = tensor("op_2822_end_0"), val = tensor([2, 192, 1, 144])]; tensor var_2822_end_mask_0 = const()[name = tensor("op_2822_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2822_cast_fp16 = slice_by_index(begin = var_2822_begin_0, end = var_2822_end_0, end_mask = var_2822_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2822_cast_fp16")]; tensor var_2826_begin_0 = const()[name = tensor("op_2826_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_2826_end_0 = const()[name = tensor("op_2826_end_0"), val = tensor([2, 256, 1, 144])]; tensor var_2826_end_mask_0 = const()[name = tensor("op_2826_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2826_cast_fp16 = slice_by_index(begin = var_2826_begin_0, end = var_2826_end_0, end_mask = var_2826_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2826_cast_fp16")]; tensor var_2830_begin_0 = const()[name = tensor("op_2830_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_2830_end_0 = const()[name = tensor("op_2830_end_0"), val = tensor([2, 320, 1, 144])]; tensor var_2830_end_mask_0 = const()[name = tensor("op_2830_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2830_cast_fp16 = slice_by_index(begin = var_2830_begin_0, end = var_2830_end_0, end_mask = var_2830_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2830_cast_fp16")]; tensor var_2834_begin_0 = const()[name = tensor("op_2834_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_2834_end_0 = const()[name = tensor("op_2834_end_0"), val = tensor([2, 384, 1, 144])]; tensor var_2834_end_mask_0 = const()[name = tensor("op_2834_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2834_cast_fp16 = slice_by_index(begin = var_2834_begin_0, end = var_2834_end_0, end_mask = var_2834_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2834_cast_fp16")]; tensor var_2838_begin_0 = const()[name = tensor("op_2838_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_2838_end_0 = const()[name = tensor("op_2838_end_0"), val = tensor([2, 448, 1, 144])]; tensor var_2838_end_mask_0 = const()[name = tensor("op_2838_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2838_cast_fp16 = slice_by_index(begin = var_2838_begin_0, end = var_2838_end_0, end_mask = var_2838_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2838_cast_fp16")]; tensor var_2842_begin_0 = const()[name = tensor("op_2842_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_2842_end_0 = const()[name = tensor("op_2842_end_0"), val = tensor([2, 512, 1, 144])]; tensor var_2842_end_mask_0 = const()[name = tensor("op_2842_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2842_cast_fp16 = slice_by_index(begin = var_2842_begin_0, end = var_2842_end_0, end_mask = var_2842_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2842_cast_fp16")]; tensor var_2846_begin_0 = const()[name = tensor("op_2846_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_2846_end_0 = const()[name = tensor("op_2846_end_0"), val = tensor([2, 576, 1, 144])]; tensor var_2846_end_mask_0 = const()[name = tensor("op_2846_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2846_cast_fp16 = slice_by_index(begin = var_2846_begin_0, end = var_2846_end_0, end_mask = var_2846_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2846_cast_fp16")]; tensor var_2850_begin_0 = const()[name = tensor("op_2850_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_2850_end_0 = const()[name = tensor("op_2850_end_0"), val = tensor([2, 640, 1, 144])]; tensor var_2850_end_mask_0 = const()[name = tensor("op_2850_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2850_cast_fp16 = slice_by_index(begin = var_2850_begin_0, end = var_2850_end_0, end_mask = var_2850_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2850_cast_fp16")]; tensor var_2854_begin_0 = const()[name = tensor("op_2854_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_2854_end_0 = const()[name = tensor("op_2854_end_0"), val = tensor([2, 704, 1, 144])]; tensor var_2854_end_mask_0 = const()[name = tensor("op_2854_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2854_cast_fp16 = slice_by_index(begin = var_2854_begin_0, end = var_2854_end_0, end_mask = var_2854_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2854_cast_fp16")]; tensor var_2858_begin_0 = const()[name = tensor("op_2858_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_2858_end_0 = const()[name = tensor("op_2858_end_0"), val = tensor([2, 768, 1, 144])]; tensor var_2858_end_mask_0 = const()[name = tensor("op_2858_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2858_cast_fp16 = slice_by_index(begin = var_2858_begin_0, end = var_2858_end_0, end_mask = var_2858_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2858_cast_fp16")]; tensor var_2862_begin_0 = const()[name = tensor("op_2862_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_2862_end_0 = const()[name = tensor("op_2862_end_0"), val = tensor([2, 832, 1, 144])]; tensor var_2862_end_mask_0 = const()[name = tensor("op_2862_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2862_cast_fp16 = slice_by_index(begin = var_2862_begin_0, end = var_2862_end_0, end_mask = var_2862_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2862_cast_fp16")]; tensor var_2866_begin_0 = const()[name = tensor("op_2866_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_2866_end_0 = const()[name = tensor("op_2866_end_0"), val = tensor([2, 896, 1, 144])]; tensor var_2866_end_mask_0 = const()[name = tensor("op_2866_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2866_cast_fp16 = slice_by_index(begin = var_2866_begin_0, end = var_2866_end_0, end_mask = var_2866_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2866_cast_fp16")]; tensor var_2870_begin_0 = const()[name = tensor("op_2870_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_2870_end_0 = const()[name = tensor("op_2870_end_0"), val = tensor([2, 960, 1, 144])]; tensor var_2870_end_mask_0 = const()[name = tensor("op_2870_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2870_cast_fp16 = slice_by_index(begin = var_2870_begin_0, end = var_2870_end_0, end_mask = var_2870_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2870_cast_fp16")]; tensor var_2874_begin_0 = const()[name = tensor("op_2874_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_2874_end_0 = const()[name = tensor("op_2874_end_0"), val = tensor([2, 1024, 1, 144])]; tensor var_2874_end_mask_0 = const()[name = tensor("op_2874_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2874_cast_fp16 = slice_by_index(begin = var_2874_begin_0, end = var_2874_end_0, end_mask = var_2874_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2874_cast_fp16")]; tensor var_2878_begin_0 = const()[name = tensor("op_2878_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_2878_end_0 = const()[name = tensor("op_2878_end_0"), val = tensor([2, 1088, 1, 144])]; tensor var_2878_end_mask_0 = const()[name = tensor("op_2878_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2878_cast_fp16 = slice_by_index(begin = var_2878_begin_0, end = var_2878_end_0, end_mask = var_2878_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2878_cast_fp16")]; tensor var_2882_begin_0 = const()[name = tensor("op_2882_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_2882_end_0 = const()[name = tensor("op_2882_end_0"), val = tensor([2, 1152, 1, 144])]; tensor var_2882_end_mask_0 = const()[name = tensor("op_2882_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2882_cast_fp16 = slice_by_index(begin = var_2882_begin_0, end = var_2882_end_0, end_mask = var_2882_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2882_cast_fp16")]; tensor var_2886_begin_0 = const()[name = tensor("op_2886_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_2886_end_0 = const()[name = tensor("op_2886_end_0"), val = tensor([2, 1216, 1, 144])]; tensor var_2886_end_mask_0 = const()[name = tensor("op_2886_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2886_cast_fp16 = slice_by_index(begin = var_2886_begin_0, end = var_2886_end_0, end_mask = var_2886_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2886_cast_fp16")]; tensor var_2890_begin_0 = const()[name = tensor("op_2890_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_2890_end_0 = const()[name = tensor("op_2890_end_0"), val = tensor([2, 1280, 1, 144])]; tensor var_2890_end_mask_0 = const()[name = tensor("op_2890_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2890_cast_fp16 = slice_by_index(begin = var_2890_begin_0, end = var_2890_end_0, end_mask = var_2890_end_mask_0, x = q_19_cast_fp16)[name = tensor("op_2890_cast_fp16")]; tensor k_39_perm_0 = const()[name = tensor("k_39_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_2897_begin_0 = const()[name = tensor("op_2897_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_2897_end_0 = const()[name = tensor("op_2897_end_0"), val = tensor([2, 77, 1, 64])]; tensor var_2897_end_mask_0 = const()[name = tensor("op_2897_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_4 = transpose(perm = k_39_perm_0, x = k_37_cast_fp16)[name = tensor("transpose_4")]; tensor var_2897_cast_fp16 = slice_by_index(begin = var_2897_begin_0, end = var_2897_end_0, end_mask = var_2897_end_mask_0, x = transpose_4)[name = tensor("op_2897_cast_fp16")]; tensor var_2901_begin_0 = const()[name = tensor("op_2901_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_2901_end_0 = const()[name = tensor("op_2901_end_0"), val = tensor([2, 77, 1, 128])]; tensor var_2901_end_mask_0 = const()[name = tensor("op_2901_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2901_cast_fp16 = slice_by_index(begin = var_2901_begin_0, end = var_2901_end_0, end_mask = var_2901_end_mask_0, x = transpose_4)[name = tensor("op_2901_cast_fp16")]; tensor var_2905_begin_0 = const()[name = tensor("op_2905_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_2905_end_0 = const()[name = tensor("op_2905_end_0"), val = tensor([2, 77, 1, 192])]; tensor var_2905_end_mask_0 = const()[name = tensor("op_2905_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2905_cast_fp16 = slice_by_index(begin = var_2905_begin_0, end = var_2905_end_0, end_mask = var_2905_end_mask_0, x = transpose_4)[name = tensor("op_2905_cast_fp16")]; tensor var_2909_begin_0 = const()[name = tensor("op_2909_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_2909_end_0 = const()[name = tensor("op_2909_end_0"), val = tensor([2, 77, 1, 256])]; tensor var_2909_end_mask_0 = const()[name = tensor("op_2909_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2909_cast_fp16 = slice_by_index(begin = var_2909_begin_0, end = var_2909_end_0, end_mask = var_2909_end_mask_0, x = transpose_4)[name = tensor("op_2909_cast_fp16")]; tensor var_2913_begin_0 = const()[name = tensor("op_2913_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_2913_end_0 = const()[name = tensor("op_2913_end_0"), val = tensor([2, 77, 1, 320])]; tensor var_2913_end_mask_0 = const()[name = tensor("op_2913_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2913_cast_fp16 = slice_by_index(begin = var_2913_begin_0, end = var_2913_end_0, end_mask = var_2913_end_mask_0, x = transpose_4)[name = tensor("op_2913_cast_fp16")]; tensor var_2917_begin_0 = const()[name = tensor("op_2917_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_2917_end_0 = const()[name = tensor("op_2917_end_0"), val = tensor([2, 77, 1, 384])]; tensor var_2917_end_mask_0 = const()[name = tensor("op_2917_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2917_cast_fp16 = slice_by_index(begin = var_2917_begin_0, end = var_2917_end_0, end_mask = var_2917_end_mask_0, x = transpose_4)[name = tensor("op_2917_cast_fp16")]; tensor var_2921_begin_0 = const()[name = tensor("op_2921_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_2921_end_0 = const()[name = tensor("op_2921_end_0"), val = tensor([2, 77, 1, 448])]; tensor var_2921_end_mask_0 = const()[name = tensor("op_2921_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2921_cast_fp16 = slice_by_index(begin = var_2921_begin_0, end = var_2921_end_0, end_mask = var_2921_end_mask_0, x = transpose_4)[name = tensor("op_2921_cast_fp16")]; tensor var_2925_begin_0 = const()[name = tensor("op_2925_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_2925_end_0 = const()[name = tensor("op_2925_end_0"), val = tensor([2, 77, 1, 512])]; tensor var_2925_end_mask_0 = const()[name = tensor("op_2925_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2925_cast_fp16 = slice_by_index(begin = var_2925_begin_0, end = var_2925_end_0, end_mask = var_2925_end_mask_0, x = transpose_4)[name = tensor("op_2925_cast_fp16")]; tensor var_2929_begin_0 = const()[name = tensor("op_2929_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_2929_end_0 = const()[name = tensor("op_2929_end_0"), val = tensor([2, 77, 1, 576])]; tensor var_2929_end_mask_0 = const()[name = tensor("op_2929_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2929_cast_fp16 = slice_by_index(begin = var_2929_begin_0, end = var_2929_end_0, end_mask = var_2929_end_mask_0, x = transpose_4)[name = tensor("op_2929_cast_fp16")]; tensor var_2933_begin_0 = const()[name = tensor("op_2933_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_2933_end_0 = const()[name = tensor("op_2933_end_0"), val = tensor([2, 77, 1, 640])]; tensor var_2933_end_mask_0 = const()[name = tensor("op_2933_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2933_cast_fp16 = slice_by_index(begin = var_2933_begin_0, end = var_2933_end_0, end_mask = var_2933_end_mask_0, x = transpose_4)[name = tensor("op_2933_cast_fp16")]; tensor var_2937_begin_0 = const()[name = tensor("op_2937_begin_0"), val = tensor([0, 0, 0, 640])]; tensor var_2937_end_0 = const()[name = tensor("op_2937_end_0"), val = tensor([2, 77, 1, 704])]; tensor var_2937_end_mask_0 = const()[name = tensor("op_2937_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2937_cast_fp16 = slice_by_index(begin = var_2937_begin_0, end = var_2937_end_0, end_mask = var_2937_end_mask_0, x = transpose_4)[name = tensor("op_2937_cast_fp16")]; tensor var_2941_begin_0 = const()[name = tensor("op_2941_begin_0"), val = tensor([0, 0, 0, 704])]; tensor var_2941_end_0 = const()[name = tensor("op_2941_end_0"), val = tensor([2, 77, 1, 768])]; tensor var_2941_end_mask_0 = const()[name = tensor("op_2941_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2941_cast_fp16 = slice_by_index(begin = var_2941_begin_0, end = var_2941_end_0, end_mask = var_2941_end_mask_0, x = transpose_4)[name = tensor("op_2941_cast_fp16")]; tensor var_2945_begin_0 = const()[name = tensor("op_2945_begin_0"), val = tensor([0, 0, 0, 768])]; tensor var_2945_end_0 = const()[name = tensor("op_2945_end_0"), val = tensor([2, 77, 1, 832])]; tensor var_2945_end_mask_0 = const()[name = tensor("op_2945_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2945_cast_fp16 = slice_by_index(begin = var_2945_begin_0, end = var_2945_end_0, end_mask = var_2945_end_mask_0, x = transpose_4)[name = tensor("op_2945_cast_fp16")]; tensor var_2949_begin_0 = const()[name = tensor("op_2949_begin_0"), val = tensor([0, 0, 0, 832])]; tensor var_2949_end_0 = const()[name = tensor("op_2949_end_0"), val = tensor([2, 77, 1, 896])]; tensor var_2949_end_mask_0 = const()[name = tensor("op_2949_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2949_cast_fp16 = slice_by_index(begin = var_2949_begin_0, end = var_2949_end_0, end_mask = var_2949_end_mask_0, x = transpose_4)[name = tensor("op_2949_cast_fp16")]; tensor var_2953_begin_0 = const()[name = tensor("op_2953_begin_0"), val = tensor([0, 0, 0, 896])]; tensor var_2953_end_0 = const()[name = tensor("op_2953_end_0"), val = tensor([2, 77, 1, 960])]; tensor var_2953_end_mask_0 = const()[name = tensor("op_2953_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2953_cast_fp16 = slice_by_index(begin = var_2953_begin_0, end = var_2953_end_0, end_mask = var_2953_end_mask_0, x = transpose_4)[name = tensor("op_2953_cast_fp16")]; tensor var_2957_begin_0 = const()[name = tensor("op_2957_begin_0"), val = tensor([0, 0, 0, 960])]; tensor var_2957_end_0 = const()[name = tensor("op_2957_end_0"), val = tensor([2, 77, 1, 1024])]; tensor var_2957_end_mask_0 = const()[name = tensor("op_2957_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2957_cast_fp16 = slice_by_index(begin = var_2957_begin_0, end = var_2957_end_0, end_mask = var_2957_end_mask_0, x = transpose_4)[name = tensor("op_2957_cast_fp16")]; tensor var_2961_begin_0 = const()[name = tensor("op_2961_begin_0"), val = tensor([0, 0, 0, 1024])]; tensor var_2961_end_0 = const()[name = tensor("op_2961_end_0"), val = tensor([2, 77, 1, 1088])]; tensor var_2961_end_mask_0 = const()[name = tensor("op_2961_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2961_cast_fp16 = slice_by_index(begin = var_2961_begin_0, end = var_2961_end_0, end_mask = var_2961_end_mask_0, x = transpose_4)[name = tensor("op_2961_cast_fp16")]; tensor var_2965_begin_0 = const()[name = tensor("op_2965_begin_0"), val = tensor([0, 0, 0, 1088])]; tensor var_2965_end_0 = const()[name = tensor("op_2965_end_0"), val = tensor([2, 77, 1, 1152])]; tensor var_2965_end_mask_0 = const()[name = tensor("op_2965_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2965_cast_fp16 = slice_by_index(begin = var_2965_begin_0, end = var_2965_end_0, end_mask = var_2965_end_mask_0, x = transpose_4)[name = tensor("op_2965_cast_fp16")]; tensor var_2969_begin_0 = const()[name = tensor("op_2969_begin_0"), val = tensor([0, 0, 0, 1152])]; tensor var_2969_end_0 = const()[name = tensor("op_2969_end_0"), val = tensor([2, 77, 1, 1216])]; tensor var_2969_end_mask_0 = const()[name = tensor("op_2969_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2969_cast_fp16 = slice_by_index(begin = var_2969_begin_0, end = var_2969_end_0, end_mask = var_2969_end_mask_0, x = transpose_4)[name = tensor("op_2969_cast_fp16")]; tensor var_2973_begin_0 = const()[name = tensor("op_2973_begin_0"), val = tensor([0, 0, 0, 1216])]; tensor var_2973_end_0 = const()[name = tensor("op_2973_end_0"), val = tensor([2, 77, 1, 1280])]; tensor var_2973_end_mask_0 = const()[name = tensor("op_2973_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_2973_cast_fp16 = slice_by_index(begin = var_2973_begin_0, end = var_2973_end_0, end_mask = var_2973_end_mask_0, x = transpose_4)[name = tensor("op_2973_cast_fp16")]; tensor var_2975_begin_0 = const()[name = tensor("op_2975_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_2975_end_0 = const()[name = tensor("op_2975_end_0"), val = tensor([2, 64, 1, 77])]; tensor var_2975_end_mask_0 = const()[name = tensor("op_2975_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2975_cast_fp16 = slice_by_index(begin = var_2975_begin_0, end = var_2975_end_0, end_mask = var_2975_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2975_cast_fp16")]; tensor var_2979_begin_0 = const()[name = tensor("op_2979_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_2979_end_0 = const()[name = tensor("op_2979_end_0"), val = tensor([2, 128, 1, 77])]; tensor var_2979_end_mask_0 = const()[name = tensor("op_2979_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2979_cast_fp16 = slice_by_index(begin = var_2979_begin_0, end = var_2979_end_0, end_mask = var_2979_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2979_cast_fp16")]; tensor var_2983_begin_0 = const()[name = tensor("op_2983_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_2983_end_0 = const()[name = tensor("op_2983_end_0"), val = tensor([2, 192, 1, 77])]; tensor var_2983_end_mask_0 = const()[name = tensor("op_2983_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2983_cast_fp16 = slice_by_index(begin = var_2983_begin_0, end = var_2983_end_0, end_mask = var_2983_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2983_cast_fp16")]; tensor var_2987_begin_0 = const()[name = tensor("op_2987_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_2987_end_0 = const()[name = tensor("op_2987_end_0"), val = tensor([2, 256, 1, 77])]; tensor var_2987_end_mask_0 = const()[name = tensor("op_2987_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2987_cast_fp16 = slice_by_index(begin = var_2987_begin_0, end = var_2987_end_0, end_mask = var_2987_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2987_cast_fp16")]; tensor var_2991_begin_0 = const()[name = tensor("op_2991_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_2991_end_0 = const()[name = tensor("op_2991_end_0"), val = tensor([2, 320, 1, 77])]; tensor var_2991_end_mask_0 = const()[name = tensor("op_2991_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2991_cast_fp16 = slice_by_index(begin = var_2991_begin_0, end = var_2991_end_0, end_mask = var_2991_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2991_cast_fp16")]; tensor var_2995_begin_0 = const()[name = tensor("op_2995_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_2995_end_0 = const()[name = tensor("op_2995_end_0"), val = tensor([2, 384, 1, 77])]; tensor var_2995_end_mask_0 = const()[name = tensor("op_2995_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2995_cast_fp16 = slice_by_index(begin = var_2995_begin_0, end = var_2995_end_0, end_mask = var_2995_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2995_cast_fp16")]; tensor var_2999_begin_0 = const()[name = tensor("op_2999_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_2999_end_0 = const()[name = tensor("op_2999_end_0"), val = tensor([2, 448, 1, 77])]; tensor var_2999_end_mask_0 = const()[name = tensor("op_2999_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_2999_cast_fp16 = slice_by_index(begin = var_2999_begin_0, end = var_2999_end_0, end_mask = var_2999_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_2999_cast_fp16")]; tensor var_3003_begin_0 = const()[name = tensor("op_3003_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_3003_end_0 = const()[name = tensor("op_3003_end_0"), val = tensor([2, 512, 1, 77])]; tensor var_3003_end_mask_0 = const()[name = tensor("op_3003_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3003_cast_fp16 = slice_by_index(begin = var_3003_begin_0, end = var_3003_end_0, end_mask = var_3003_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3003_cast_fp16")]; tensor var_3007_begin_0 = const()[name = tensor("op_3007_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_3007_end_0 = const()[name = tensor("op_3007_end_0"), val = tensor([2, 576, 1, 77])]; tensor var_3007_end_mask_0 = const()[name = tensor("op_3007_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3007_cast_fp16 = slice_by_index(begin = var_3007_begin_0, end = var_3007_end_0, end_mask = var_3007_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3007_cast_fp16")]; tensor var_3011_begin_0 = const()[name = tensor("op_3011_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_3011_end_0 = const()[name = tensor("op_3011_end_0"), val = tensor([2, 640, 1, 77])]; tensor var_3011_end_mask_0 = const()[name = tensor("op_3011_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3011_cast_fp16 = slice_by_index(begin = var_3011_begin_0, end = var_3011_end_0, end_mask = var_3011_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3011_cast_fp16")]; tensor var_3015_begin_0 = const()[name = tensor("op_3015_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_3015_end_0 = const()[name = tensor("op_3015_end_0"), val = tensor([2, 704, 1, 77])]; tensor var_3015_end_mask_0 = const()[name = tensor("op_3015_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3015_cast_fp16 = slice_by_index(begin = var_3015_begin_0, end = var_3015_end_0, end_mask = var_3015_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3015_cast_fp16")]; tensor var_3019_begin_0 = const()[name = tensor("op_3019_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_3019_end_0 = const()[name = tensor("op_3019_end_0"), val = tensor([2, 768, 1, 77])]; tensor var_3019_end_mask_0 = const()[name = tensor("op_3019_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3019_cast_fp16 = slice_by_index(begin = var_3019_begin_0, end = var_3019_end_0, end_mask = var_3019_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3019_cast_fp16")]; tensor var_3023_begin_0 = const()[name = tensor("op_3023_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_3023_end_0 = const()[name = tensor("op_3023_end_0"), val = tensor([2, 832, 1, 77])]; tensor var_3023_end_mask_0 = const()[name = tensor("op_3023_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3023_cast_fp16 = slice_by_index(begin = var_3023_begin_0, end = var_3023_end_0, end_mask = var_3023_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3023_cast_fp16")]; tensor var_3027_begin_0 = const()[name = tensor("op_3027_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_3027_end_0 = const()[name = tensor("op_3027_end_0"), val = tensor([2, 896, 1, 77])]; tensor var_3027_end_mask_0 = const()[name = tensor("op_3027_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3027_cast_fp16 = slice_by_index(begin = var_3027_begin_0, end = var_3027_end_0, end_mask = var_3027_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3027_cast_fp16")]; tensor var_3031_begin_0 = const()[name = tensor("op_3031_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_3031_end_0 = const()[name = tensor("op_3031_end_0"), val = tensor([2, 960, 1, 77])]; tensor var_3031_end_mask_0 = const()[name = tensor("op_3031_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3031_cast_fp16 = slice_by_index(begin = var_3031_begin_0, end = var_3031_end_0, end_mask = var_3031_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3031_cast_fp16")]; tensor var_3035_begin_0 = const()[name = tensor("op_3035_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_3035_end_0 = const()[name = tensor("op_3035_end_0"), val = tensor([2, 1024, 1, 77])]; tensor var_3035_end_mask_0 = const()[name = tensor("op_3035_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3035_cast_fp16 = slice_by_index(begin = var_3035_begin_0, end = var_3035_end_0, end_mask = var_3035_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3035_cast_fp16")]; tensor var_3039_begin_0 = const()[name = tensor("op_3039_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_3039_end_0 = const()[name = tensor("op_3039_end_0"), val = tensor([2, 1088, 1, 77])]; tensor var_3039_end_mask_0 = const()[name = tensor("op_3039_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3039_cast_fp16 = slice_by_index(begin = var_3039_begin_0, end = var_3039_end_0, end_mask = var_3039_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3039_cast_fp16")]; tensor var_3043_begin_0 = const()[name = tensor("op_3043_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_3043_end_0 = const()[name = tensor("op_3043_end_0"), val = tensor([2, 1152, 1, 77])]; tensor var_3043_end_mask_0 = const()[name = tensor("op_3043_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3043_cast_fp16 = slice_by_index(begin = var_3043_begin_0, end = var_3043_end_0, end_mask = var_3043_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3043_cast_fp16")]; tensor var_3047_begin_0 = const()[name = tensor("op_3047_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_3047_end_0 = const()[name = tensor("op_3047_end_0"), val = tensor([2, 1216, 1, 77])]; tensor var_3047_end_mask_0 = const()[name = tensor("op_3047_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3047_cast_fp16 = slice_by_index(begin = var_3047_begin_0, end = var_3047_end_0, end_mask = var_3047_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3047_cast_fp16")]; tensor var_3051_begin_0 = const()[name = tensor("op_3051_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_3051_end_0 = const()[name = tensor("op_3051_end_0"), val = tensor([2, 1280, 1, 77])]; tensor var_3051_end_mask_0 = const()[name = tensor("op_3051_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3051_cast_fp16 = slice_by_index(begin = var_3051_begin_0, end = var_3051_end_0, end_mask = var_3051_end_mask_0, x = v_19_cast_fp16)[name = tensor("op_3051_cast_fp16")]; tensor var_3055_equation_0 = const()[name = tensor("op_3055_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3055_cast_fp16 = einsum(equation = var_3055_equation_0, values = (var_2897_cast_fp16, var_2814_cast_fp16))[name = tensor("op_3055_cast_fp16")]; tensor var_3056_to_fp16 = const()[name = tensor("op_3056_to_fp16"), val = tensor(0x1p-3)]; tensor aw_161_cast_fp16 = mul(x = var_3055_cast_fp16, y = var_3056_to_fp16)[name = tensor("aw_161_cast_fp16")]; tensor var_3059_equation_0 = const()[name = tensor("op_3059_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3059_cast_fp16 = einsum(equation = var_3059_equation_0, values = (var_2901_cast_fp16, var_2818_cast_fp16))[name = tensor("op_3059_cast_fp16")]; tensor var_3060_to_fp16 = const()[name = tensor("op_3060_to_fp16"), val = tensor(0x1p-3)]; tensor aw_163_cast_fp16 = mul(x = var_3059_cast_fp16, y = var_3060_to_fp16)[name = tensor("aw_163_cast_fp16")]; tensor var_3063_equation_0 = const()[name = tensor("op_3063_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3063_cast_fp16 = einsum(equation = var_3063_equation_0, values = (var_2905_cast_fp16, var_2822_cast_fp16))[name = tensor("op_3063_cast_fp16")]; tensor var_3064_to_fp16 = const()[name = tensor("op_3064_to_fp16"), val = tensor(0x1p-3)]; tensor aw_165_cast_fp16 = mul(x = var_3063_cast_fp16, y = var_3064_to_fp16)[name = tensor("aw_165_cast_fp16")]; tensor var_3067_equation_0 = const()[name = tensor("op_3067_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3067_cast_fp16 = einsum(equation = var_3067_equation_0, values = (var_2909_cast_fp16, var_2826_cast_fp16))[name = tensor("op_3067_cast_fp16")]; tensor var_3068_to_fp16 = const()[name = tensor("op_3068_to_fp16"), val = tensor(0x1p-3)]; tensor aw_167_cast_fp16 = mul(x = var_3067_cast_fp16, y = var_3068_to_fp16)[name = tensor("aw_167_cast_fp16")]; tensor var_3071_equation_0 = const()[name = tensor("op_3071_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3071_cast_fp16 = einsum(equation = var_3071_equation_0, values = (var_2913_cast_fp16, var_2830_cast_fp16))[name = tensor("op_3071_cast_fp16")]; tensor var_3072_to_fp16 = const()[name = tensor("op_3072_to_fp16"), val = tensor(0x1p-3)]; tensor aw_169_cast_fp16 = mul(x = var_3071_cast_fp16, y = var_3072_to_fp16)[name = tensor("aw_169_cast_fp16")]; tensor var_3075_equation_0 = const()[name = tensor("op_3075_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3075_cast_fp16 = einsum(equation = var_3075_equation_0, values = (var_2917_cast_fp16, var_2834_cast_fp16))[name = tensor("op_3075_cast_fp16")]; tensor var_3076_to_fp16 = const()[name = tensor("op_3076_to_fp16"), val = tensor(0x1p-3)]; tensor aw_171_cast_fp16 = mul(x = var_3075_cast_fp16, y = var_3076_to_fp16)[name = tensor("aw_171_cast_fp16")]; tensor var_3079_equation_0 = const()[name = tensor("op_3079_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3079_cast_fp16 = einsum(equation = var_3079_equation_0, values = (var_2921_cast_fp16, var_2838_cast_fp16))[name = tensor("op_3079_cast_fp16")]; tensor var_3080_to_fp16 = const()[name = tensor("op_3080_to_fp16"), val = tensor(0x1p-3)]; tensor aw_173_cast_fp16 = mul(x = var_3079_cast_fp16, y = var_3080_to_fp16)[name = tensor("aw_173_cast_fp16")]; tensor var_3083_equation_0 = const()[name = tensor("op_3083_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3083_cast_fp16 = einsum(equation = var_3083_equation_0, values = (var_2925_cast_fp16, var_2842_cast_fp16))[name = tensor("op_3083_cast_fp16")]; tensor var_3084_to_fp16 = const()[name = tensor("op_3084_to_fp16"), val = tensor(0x1p-3)]; tensor aw_175_cast_fp16 = mul(x = var_3083_cast_fp16, y = var_3084_to_fp16)[name = tensor("aw_175_cast_fp16")]; tensor var_3087_equation_0 = const()[name = tensor("op_3087_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3087_cast_fp16 = einsum(equation = var_3087_equation_0, values = (var_2929_cast_fp16, var_2846_cast_fp16))[name = tensor("op_3087_cast_fp16")]; tensor var_3088_to_fp16 = const()[name = tensor("op_3088_to_fp16"), val = tensor(0x1p-3)]; tensor aw_177_cast_fp16 = mul(x = var_3087_cast_fp16, y = var_3088_to_fp16)[name = tensor("aw_177_cast_fp16")]; tensor var_3091_equation_0 = const()[name = tensor("op_3091_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3091_cast_fp16 = einsum(equation = var_3091_equation_0, values = (var_2933_cast_fp16, var_2850_cast_fp16))[name = tensor("op_3091_cast_fp16")]; tensor var_3092_to_fp16 = const()[name = tensor("op_3092_to_fp16"), val = tensor(0x1p-3)]; tensor aw_179_cast_fp16 = mul(x = var_3091_cast_fp16, y = var_3092_to_fp16)[name = tensor("aw_179_cast_fp16")]; tensor var_3095_equation_0 = const()[name = tensor("op_3095_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3095_cast_fp16 = einsum(equation = var_3095_equation_0, values = (var_2937_cast_fp16, var_2854_cast_fp16))[name = tensor("op_3095_cast_fp16")]; tensor var_3096_to_fp16 = const()[name = tensor("op_3096_to_fp16"), val = tensor(0x1p-3)]; tensor aw_181_cast_fp16 = mul(x = var_3095_cast_fp16, y = var_3096_to_fp16)[name = tensor("aw_181_cast_fp16")]; tensor var_3099_equation_0 = const()[name = tensor("op_3099_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3099_cast_fp16 = einsum(equation = var_3099_equation_0, values = (var_2941_cast_fp16, var_2858_cast_fp16))[name = tensor("op_3099_cast_fp16")]; tensor var_3100_to_fp16 = const()[name = tensor("op_3100_to_fp16"), val = tensor(0x1p-3)]; tensor aw_183_cast_fp16 = mul(x = var_3099_cast_fp16, y = var_3100_to_fp16)[name = tensor("aw_183_cast_fp16")]; tensor var_3103_equation_0 = const()[name = tensor("op_3103_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3103_cast_fp16 = einsum(equation = var_3103_equation_0, values = (var_2945_cast_fp16, var_2862_cast_fp16))[name = tensor("op_3103_cast_fp16")]; tensor var_3104_to_fp16 = const()[name = tensor("op_3104_to_fp16"), val = tensor(0x1p-3)]; tensor aw_185_cast_fp16 = mul(x = var_3103_cast_fp16, y = var_3104_to_fp16)[name = tensor("aw_185_cast_fp16")]; tensor var_3107_equation_0 = const()[name = tensor("op_3107_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3107_cast_fp16 = einsum(equation = var_3107_equation_0, values = (var_2949_cast_fp16, var_2866_cast_fp16))[name = tensor("op_3107_cast_fp16")]; tensor var_3108_to_fp16 = const()[name = tensor("op_3108_to_fp16"), val = tensor(0x1p-3)]; tensor aw_187_cast_fp16 = mul(x = var_3107_cast_fp16, y = var_3108_to_fp16)[name = tensor("aw_187_cast_fp16")]; tensor var_3111_equation_0 = const()[name = tensor("op_3111_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3111_cast_fp16 = einsum(equation = var_3111_equation_0, values = (var_2953_cast_fp16, var_2870_cast_fp16))[name = tensor("op_3111_cast_fp16")]; tensor var_3112_to_fp16 = const()[name = tensor("op_3112_to_fp16"), val = tensor(0x1p-3)]; tensor aw_189_cast_fp16 = mul(x = var_3111_cast_fp16, y = var_3112_to_fp16)[name = tensor("aw_189_cast_fp16")]; tensor var_3115_equation_0 = const()[name = tensor("op_3115_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3115_cast_fp16 = einsum(equation = var_3115_equation_0, values = (var_2957_cast_fp16, var_2874_cast_fp16))[name = tensor("op_3115_cast_fp16")]; tensor var_3116_to_fp16 = const()[name = tensor("op_3116_to_fp16"), val = tensor(0x1p-3)]; tensor aw_191_cast_fp16 = mul(x = var_3115_cast_fp16, y = var_3116_to_fp16)[name = tensor("aw_191_cast_fp16")]; tensor var_3119_equation_0 = const()[name = tensor("op_3119_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3119_cast_fp16 = einsum(equation = var_3119_equation_0, values = (var_2961_cast_fp16, var_2878_cast_fp16))[name = tensor("op_3119_cast_fp16")]; tensor var_3120_to_fp16 = const()[name = tensor("op_3120_to_fp16"), val = tensor(0x1p-3)]; tensor aw_193_cast_fp16 = mul(x = var_3119_cast_fp16, y = var_3120_to_fp16)[name = tensor("aw_193_cast_fp16")]; tensor var_3123_equation_0 = const()[name = tensor("op_3123_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3123_cast_fp16 = einsum(equation = var_3123_equation_0, values = (var_2965_cast_fp16, var_2882_cast_fp16))[name = tensor("op_3123_cast_fp16")]; tensor var_3124_to_fp16 = const()[name = tensor("op_3124_to_fp16"), val = tensor(0x1p-3)]; tensor aw_195_cast_fp16 = mul(x = var_3123_cast_fp16, y = var_3124_to_fp16)[name = tensor("aw_195_cast_fp16")]; tensor var_3127_equation_0 = const()[name = tensor("op_3127_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3127_cast_fp16 = einsum(equation = var_3127_equation_0, values = (var_2969_cast_fp16, var_2886_cast_fp16))[name = tensor("op_3127_cast_fp16")]; tensor var_3128_to_fp16 = const()[name = tensor("op_3128_to_fp16"), val = tensor(0x1p-3)]; tensor aw_197_cast_fp16 = mul(x = var_3127_cast_fp16, y = var_3128_to_fp16)[name = tensor("aw_197_cast_fp16")]; tensor var_3131_equation_0 = const()[name = tensor("op_3131_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3131_cast_fp16 = einsum(equation = var_3131_equation_0, values = (var_2973_cast_fp16, var_2890_cast_fp16))[name = tensor("op_3131_cast_fp16")]; tensor var_3132_to_fp16 = const()[name = tensor("op_3132_to_fp16"), val = tensor(0x1p-3)]; tensor aw_199_cast_fp16 = mul(x = var_3131_cast_fp16, y = var_3132_to_fp16)[name = tensor("aw_199_cast_fp16")]; tensor var_3134_cast_fp16 = softmax(axis = var_2254, x = aw_161_cast_fp16)[name = tensor("op_3134_cast_fp16")]; tensor var_3135_cast_fp16 = softmax(axis = var_2254, x = aw_163_cast_fp16)[name = tensor("op_3135_cast_fp16")]; tensor var_3136_cast_fp16 = softmax(axis = var_2254, x = aw_165_cast_fp16)[name = tensor("op_3136_cast_fp16")]; tensor var_3137_cast_fp16 = softmax(axis = var_2254, x = aw_167_cast_fp16)[name = tensor("op_3137_cast_fp16")]; tensor var_3138_cast_fp16 = softmax(axis = var_2254, x = aw_169_cast_fp16)[name = tensor("op_3138_cast_fp16")]; tensor var_3139_cast_fp16 = softmax(axis = var_2254, x = aw_171_cast_fp16)[name = tensor("op_3139_cast_fp16")]; tensor var_3140_cast_fp16 = softmax(axis = var_2254, x = aw_173_cast_fp16)[name = tensor("op_3140_cast_fp16")]; tensor var_3141_cast_fp16 = softmax(axis = var_2254, x = aw_175_cast_fp16)[name = tensor("op_3141_cast_fp16")]; tensor var_3142_cast_fp16 = softmax(axis = var_2254, x = aw_177_cast_fp16)[name = tensor("op_3142_cast_fp16")]; tensor var_3143_cast_fp16 = softmax(axis = var_2254, x = aw_179_cast_fp16)[name = tensor("op_3143_cast_fp16")]; tensor var_3144_cast_fp16 = softmax(axis = var_2254, x = aw_181_cast_fp16)[name = tensor("op_3144_cast_fp16")]; tensor var_3145_cast_fp16 = softmax(axis = var_2254, x = aw_183_cast_fp16)[name = tensor("op_3145_cast_fp16")]; tensor var_3146_cast_fp16 = softmax(axis = var_2254, x = aw_185_cast_fp16)[name = tensor("op_3146_cast_fp16")]; tensor var_3147_cast_fp16 = softmax(axis = var_2254, x = aw_187_cast_fp16)[name = tensor("op_3147_cast_fp16")]; tensor var_3148_cast_fp16 = softmax(axis = var_2254, x = aw_189_cast_fp16)[name = tensor("op_3148_cast_fp16")]; tensor var_3149_cast_fp16 = softmax(axis = var_2254, x = aw_191_cast_fp16)[name = tensor("op_3149_cast_fp16")]; tensor var_3150_cast_fp16 = softmax(axis = var_2254, x = aw_193_cast_fp16)[name = tensor("op_3150_cast_fp16")]; tensor var_3151_cast_fp16 = softmax(axis = var_2254, x = aw_195_cast_fp16)[name = tensor("op_3151_cast_fp16")]; tensor var_3152_cast_fp16 = softmax(axis = var_2254, x = aw_197_cast_fp16)[name = tensor("op_3152_cast_fp16")]; tensor var_3153_cast_fp16 = softmax(axis = var_2254, x = aw_199_cast_fp16)[name = tensor("op_3153_cast_fp16")]; tensor var_3155_equation_0 = const()[name = tensor("op_3155_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3155_cast_fp16 = einsum(equation = var_3155_equation_0, values = (var_2975_cast_fp16, var_3134_cast_fp16))[name = tensor("op_3155_cast_fp16")]; tensor var_3157_equation_0 = const()[name = tensor("op_3157_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3157_cast_fp16 = einsum(equation = var_3157_equation_0, values = (var_2979_cast_fp16, var_3135_cast_fp16))[name = tensor("op_3157_cast_fp16")]; tensor var_3159_equation_0 = const()[name = tensor("op_3159_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3159_cast_fp16 = einsum(equation = var_3159_equation_0, values = (var_2983_cast_fp16, var_3136_cast_fp16))[name = tensor("op_3159_cast_fp16")]; tensor var_3161_equation_0 = const()[name = tensor("op_3161_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3161_cast_fp16 = einsum(equation = var_3161_equation_0, values = (var_2987_cast_fp16, var_3137_cast_fp16))[name = tensor("op_3161_cast_fp16")]; tensor var_3163_equation_0 = const()[name = tensor("op_3163_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3163_cast_fp16 = einsum(equation = var_3163_equation_0, values = (var_2991_cast_fp16, var_3138_cast_fp16))[name = tensor("op_3163_cast_fp16")]; tensor var_3165_equation_0 = const()[name = tensor("op_3165_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3165_cast_fp16 = einsum(equation = var_3165_equation_0, values = (var_2995_cast_fp16, var_3139_cast_fp16))[name = tensor("op_3165_cast_fp16")]; tensor var_3167_equation_0 = const()[name = tensor("op_3167_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3167_cast_fp16 = einsum(equation = var_3167_equation_0, values = (var_2999_cast_fp16, var_3140_cast_fp16))[name = tensor("op_3167_cast_fp16")]; tensor var_3169_equation_0 = const()[name = tensor("op_3169_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3169_cast_fp16 = einsum(equation = var_3169_equation_0, values = (var_3003_cast_fp16, var_3141_cast_fp16))[name = tensor("op_3169_cast_fp16")]; tensor var_3171_equation_0 = const()[name = tensor("op_3171_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3171_cast_fp16 = einsum(equation = var_3171_equation_0, values = (var_3007_cast_fp16, var_3142_cast_fp16))[name = tensor("op_3171_cast_fp16")]; tensor var_3173_equation_0 = const()[name = tensor("op_3173_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3173_cast_fp16 = einsum(equation = var_3173_equation_0, values = (var_3011_cast_fp16, var_3143_cast_fp16))[name = tensor("op_3173_cast_fp16")]; tensor var_3175_equation_0 = const()[name = tensor("op_3175_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3175_cast_fp16 = einsum(equation = var_3175_equation_0, values = (var_3015_cast_fp16, var_3144_cast_fp16))[name = tensor("op_3175_cast_fp16")]; tensor var_3177_equation_0 = const()[name = tensor("op_3177_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3177_cast_fp16 = einsum(equation = var_3177_equation_0, values = (var_3019_cast_fp16, var_3145_cast_fp16))[name = tensor("op_3177_cast_fp16")]; tensor var_3179_equation_0 = const()[name = tensor("op_3179_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3179_cast_fp16 = einsum(equation = var_3179_equation_0, values = (var_3023_cast_fp16, var_3146_cast_fp16))[name = tensor("op_3179_cast_fp16")]; tensor var_3181_equation_0 = const()[name = tensor("op_3181_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3181_cast_fp16 = einsum(equation = var_3181_equation_0, values = (var_3027_cast_fp16, var_3147_cast_fp16))[name = tensor("op_3181_cast_fp16")]; tensor var_3183_equation_0 = const()[name = tensor("op_3183_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3183_cast_fp16 = einsum(equation = var_3183_equation_0, values = (var_3031_cast_fp16, var_3148_cast_fp16))[name = tensor("op_3183_cast_fp16")]; tensor var_3185_equation_0 = const()[name = tensor("op_3185_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3185_cast_fp16 = einsum(equation = var_3185_equation_0, values = (var_3035_cast_fp16, var_3149_cast_fp16))[name = tensor("op_3185_cast_fp16")]; tensor var_3187_equation_0 = const()[name = tensor("op_3187_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3187_cast_fp16 = einsum(equation = var_3187_equation_0, values = (var_3039_cast_fp16, var_3150_cast_fp16))[name = tensor("op_3187_cast_fp16")]; tensor var_3189_equation_0 = const()[name = tensor("op_3189_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3189_cast_fp16 = einsum(equation = var_3189_equation_0, values = (var_3043_cast_fp16, var_3151_cast_fp16))[name = tensor("op_3189_cast_fp16")]; tensor var_3191_equation_0 = const()[name = tensor("op_3191_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3191_cast_fp16 = einsum(equation = var_3191_equation_0, values = (var_3047_cast_fp16, var_3152_cast_fp16))[name = tensor("op_3191_cast_fp16")]; tensor var_3193_equation_0 = const()[name = tensor("op_3193_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3193_cast_fp16 = einsum(equation = var_3193_equation_0, values = (var_3051_cast_fp16, var_3153_cast_fp16))[name = tensor("op_3193_cast_fp16")]; tensor input_135_interleave_0 = const()[name = tensor("input_135_interleave_0"), val = tensor(false)]; tensor input_135_cast_fp16 = concat(axis = var_2254, interleave = input_135_interleave_0, values = (var_3155_cast_fp16, var_3157_cast_fp16, var_3159_cast_fp16, var_3161_cast_fp16, var_3163_cast_fp16, var_3165_cast_fp16, var_3167_cast_fp16, var_3169_cast_fp16, var_3171_cast_fp16, var_3173_cast_fp16, var_3175_cast_fp16, var_3177_cast_fp16, var_3179_cast_fp16, var_3181_cast_fp16, var_3183_cast_fp16, var_3185_cast_fp16, var_3187_cast_fp16, var_3189_cast_fp16, var_3191_cast_fp16, var_3193_cast_fp16))[name = tensor("input_135_cast_fp16")]; tensor var_3199 = const()[name = tensor("op_3199"), val = tensor([1, 1])]; tensor var_3201 = const()[name = tensor("op_3201"), val = tensor([1, 1])]; tensor var_3203_pad_type_0 = const()[name = tensor("op_3203_pad_type_0"), val = tensor("custom")]; tensor var_3203_pad_0 = const()[name = tensor("op_3203_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(174892608)))]; tensor down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178169472)))]; tensor var_3203_cast_fp16 = conv(bias = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_3201, groups = var_2254, pad = var_3203_pad_0, pad_type = var_3203_pad_type_0, strides = var_3199, weight = down_blocks_2_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_135_cast_fp16)[name = tensor("op_3203_cast_fp16")]; tensor inputs_29_cast_fp16 = add(x = var_3203_cast_fp16, y = inputs_27_cast_fp16)[name = tensor("inputs_29_cast_fp16")]; tensor var_3207 = const()[name = tensor("op_3207"), val = tensor([1])]; tensor channels_mean_29_cast_fp16 = reduce_mean(axes = var_3207, keep_dims = var_2249, x = inputs_29_cast_fp16)[name = tensor("channels_mean_29_cast_fp16")]; tensor zero_mean_29_cast_fp16 = sub(x = inputs_29_cast_fp16, y = channels_mean_29_cast_fp16)[name = tensor("zero_mean_29_cast_fp16")]; tensor zero_mean_sq_29_cast_fp16 = mul(x = zero_mean_29_cast_fp16, y = zero_mean_29_cast_fp16)[name = tensor("zero_mean_sq_29_cast_fp16")]; tensor var_3211 = const()[name = tensor("op_3211"), val = tensor([1])]; tensor var_3212_cast_fp16 = reduce_mean(axes = var_3211, keep_dims = var_2249, x = zero_mean_sq_29_cast_fp16)[name = tensor("op_3212_cast_fp16")]; tensor var_3213_to_fp16 = const()[name = tensor("op_3213_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3214_cast_fp16 = add(x = var_3212_cast_fp16, y = var_3213_to_fp16)[name = tensor("op_3214_cast_fp16")]; tensor denom_29_epsilon_0_to_fp16 = const()[name = tensor("denom_29_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_29_cast_fp16 = rsqrt(epsilon = denom_29_epsilon_0_to_fp16, x = var_3214_cast_fp16)[name = tensor("denom_29_cast_fp16")]; tensor out_29_cast_fp16 = mul(x = zero_mean_29_cast_fp16, y = denom_29_cast_fp16)[name = tensor("out_29_cast_fp16")]; tensor var_3218_to_fp16 = const()[name = tensor("op_3218_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178172096)))]; tensor var_3219_cast_fp16 = add(x = out_29_cast_fp16, y = var_3218_to_fp16)[name = tensor("op_3219_cast_fp16")]; tensor var_3221_to_fp16 = const()[name = tensor("op_3221_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178174720)))]; tensor input_137_cast_fp16 = mul(x = var_3219_cast_fp16, y = var_3221_to_fp16)[name = tensor("input_137_cast_fp16")]; tensor var_3229 = const()[name = tensor("op_3229"), val = tensor([1, 1])]; tensor var_3231 = const()[name = tensor("op_3231"), val = tensor([1, 1])]; tensor var_3233_pad_type_0 = const()[name = tensor("op_3233_pad_type_0"), val = tensor("custom")]; tensor var_3233_pad_0 = const()[name = tensor("op_3233_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(178177344)))]; tensor down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204391808)))]; tensor var_3233_cast_fp16 = conv(bias = down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_3231, groups = var_2254, pad = var_3233_pad_0, pad_type = var_3233_pad_type_0, strides = var_3229, weight = down_blocks_2_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_137_cast_fp16)[name = tensor("op_3233_cast_fp16")]; tensor var_3234_split_sizes_0 = const()[name = tensor("op_3234_split_sizes_0"), val = tensor([5120, 5120])]; tensor var_3234_axis_0 = const()[name = tensor("op_3234_axis_0"), val = tensor(1)]; tensor var_3234_cast_fp16_0, tensor var_3234_cast_fp16_1 = split(axis = var_3234_axis_0, split_sizes = var_3234_split_sizes_0, x = var_3233_cast_fp16)[name = tensor("op_3234_cast_fp16")]; tensor var_3236_mode_0 = const()[name = tensor("op_3236_mode_0"), val = tensor("EXACT")]; tensor var_3236_cast_fp16 = gelu(mode = var_3236_mode_0, x = var_3234_cast_fp16_1)[name = tensor("op_3236_cast_fp16")]; tensor input_139_cast_fp16 = mul(x = var_3234_cast_fp16_0, y = var_3236_cast_fp16)[name = tensor("input_139_cast_fp16")]; tensor var_3240 = const()[name = tensor("op_3240"), val = tensor([1, 1])]; tensor var_3242 = const()[name = tensor("op_3242"), val = tensor([1, 1])]; tensor var_3244_pad_type_0 = const()[name = tensor("op_3244_pad_type_0"), val = tensor("custom")]; tensor var_3244_pad_0 = const()[name = tensor("op_3244_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(204412352)))]; tensor down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217519616)))]; tensor var_3244_cast_fp16 = conv(bias = down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_3242, groups = var_2254, pad = var_3244_pad_0, pad_type = var_3244_pad_type_0, strides = var_3240, weight = down_blocks_2_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_139_cast_fp16)[name = tensor("op_3244_cast_fp16")]; tensor hidden_states_87_cast_fp16 = add(x = var_3244_cast_fp16, y = inputs_29_cast_fp16)[name = tensor("hidden_states_87_cast_fp16")]; tensor var_3246 = const()[name = tensor("op_3246"), val = tensor([2, 1280, 12, 12])]; tensor input_141_cast_fp16 = reshape(shape = var_3246, x = hidden_states_87_cast_fp16)[name = tensor("input_141_cast_fp16")]; tensor var_3250 = const()[name = tensor("op_3250"), val = tensor([1, 1])]; tensor var_3252 = const()[name = tensor("op_3252"), val = tensor([1, 1])]; tensor hidden_states_89_pad_type_0 = const()[name = tensor("hidden_states_89_pad_type_0"), val = tensor("custom")]; tensor hidden_states_89_pad_0 = const()[name = tensor("hidden_states_89_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217522240)))]; tensor down_blocks_2_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220799104)))]; tensor hidden_states_89_cast_fp16 = conv(bias = down_blocks_2_attentions_0_proj_out_bias_to_fp16, dilations = var_3252, groups = var_2254, pad = hidden_states_89_pad_0, pad_type = hidden_states_89_pad_type_0, strides = var_3250, weight = down_blocks_2_attentions_0_proj_out_weight_to_fp16, x = input_141_cast_fp16)[name = tensor("hidden_states_89_cast_fp16")]; tensor input_143_cast_fp16_1 = add(x = hidden_states_89_cast_fp16, y = hidden_states_77_cast_fp16)[name = tensor("input_143_cast_fp16")]; tensor reshape_60_shape_0 = const()[name = tensor("reshape_60_shape_0"), val = tensor([2, 32, 40, 12, 12])]; tensor reshape_60_cast_fp16 = reshape(shape = reshape_60_shape_0, x = input_143_cast_fp16_1)[name = tensor("reshape_60_cast_fp16")]; tensor reduce_mean_45_axes_0 = const()[name = tensor("reduce_mean_45_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_45_keep_dims_0 = const()[name = tensor("reduce_mean_45_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_45_cast_fp16 = reduce_mean(axes = reduce_mean_45_axes_0, keep_dims = reduce_mean_45_keep_dims_0, x = reshape_60_cast_fp16)[name = tensor("reduce_mean_45_cast_fp16")]; tensor sub_30_cast_fp16 = sub(x = reshape_60_cast_fp16, y = reduce_mean_45_cast_fp16)[name = tensor("sub_30_cast_fp16")]; tensor square_15_cast_fp16 = square(x = sub_30_cast_fp16)[name = tensor("square_15_cast_fp16")]; tensor reduce_mean_47_axes_0 = const()[name = tensor("reduce_mean_47_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_47_keep_dims_0 = const()[name = tensor("reduce_mean_47_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_47_cast_fp16 = reduce_mean(axes = reduce_mean_47_axes_0, keep_dims = reduce_mean_47_keep_dims_0, x = square_15_cast_fp16)[name = tensor("reduce_mean_47_cast_fp16")]; tensor add_30_y_0_to_fp16 = const()[name = tensor("add_30_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_30_cast_fp16 = add(x = reduce_mean_47_cast_fp16, y = add_30_y_0_to_fp16)[name = tensor("add_30_cast_fp16")]; tensor sqrt_15_cast_fp16 = sqrt(x = add_30_cast_fp16)[name = tensor("sqrt_15_cast_fp16")]; tensor real_div_15_cast_fp16 = real_div(x = sub_30_cast_fp16, y = sqrt_15_cast_fp16)[name = tensor("real_div_15_cast_fp16")]; tensor reshape_61_shape_0 = const()[name = tensor("reshape_61_shape_0"), val = tensor([2, 1280, 12, 12])]; tensor reshape_61_cast_fp16 = reshape(shape = reshape_61_shape_0, x = real_div_15_cast_fp16)[name = tensor("reshape_61_cast_fp16")]; tensor add_31_gamma_0_to_fp16 = const()[name = tensor("add_31_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220801728)))]; tensor add_31_beta_0_to_fp16 = const()[name = tensor("add_31_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220804352)))]; tensor add_31_epsilon_0_to_fp16 = const()[name = tensor("add_31_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_31_cast_fp16 = batch_norm(beta = add_31_beta_0_to_fp16, epsilon = add_31_epsilon_0_to_fp16, gamma = add_31_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_61_cast_fp16)[name = tensor("add_31_cast_fp16")]; tensor input_147_cast_fp16 = silu(x = add_31_cast_fp16)[name = tensor("input_147_cast_fp16")]; tensor var_3267 = const()[name = tensor("op_3267"), val = tensor([1, 1])]; tensor var_3269 = const()[name = tensor("op_3269"), val = tensor([1, 1])]; tensor hidden_states_91_pad_type_0 = const()[name = tensor("hidden_states_91_pad_type_0"), val = tensor("custom")]; tensor hidden_states_91_pad_0 = const()[name = tensor("hidden_states_91_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_2_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(220806976)))]; tensor down_blocks_2_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250298240)))]; tensor hidden_states_91_cast_fp16 = conv(bias = down_blocks_2_resnets_1_conv1_bias_to_fp16, dilations = var_3269, groups = var_2254, pad = hidden_states_91_pad_0, pad_type = hidden_states_91_pad_type_0, strides = var_3267, weight = down_blocks_2_resnets_1_conv1_weight_to_fp16, x = input_147_cast_fp16)[name = tensor("hidden_states_91_cast_fp16")]; tensor var_3275 = const()[name = tensor("op_3275"), val = tensor([1, 1])]; tensor var_3277 = const()[name = tensor("op_3277"), val = tensor([1, 1])]; tensor temb_11_pad_type_0 = const()[name = tensor("temb_11_pad_type_0"), val = tensor("custom")]; tensor temb_11_pad_0 = const()[name = tensor("temb_11_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(250300864)))]; tensor down_blocks_2_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253577728)))]; tensor temb_11_cast_fp16 = conv(bias = down_blocks_2_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_3277, groups = var_2254, pad = temb_11_pad_0, pad_type = temb_11_pad_type_0, strides = var_3275, weight = down_blocks_2_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_11_cast_fp16")]; tensor input_151_cast_fp16 = add(x = hidden_states_91_cast_fp16, y = temb_11_cast_fp16)[name = tensor("input_151_cast_fp16")]; tensor reshape_64_shape_0 = const()[name = tensor("reshape_64_shape_0"), val = tensor([2, 32, 40, 12, 12])]; tensor reshape_64_cast_fp16 = reshape(shape = reshape_64_shape_0, x = input_151_cast_fp16)[name = tensor("reshape_64_cast_fp16")]; tensor reduce_mean_48_axes_0 = const()[name = tensor("reduce_mean_48_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_48_keep_dims_0 = const()[name = tensor("reduce_mean_48_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_48_cast_fp16 = reduce_mean(axes = reduce_mean_48_axes_0, keep_dims = reduce_mean_48_keep_dims_0, x = reshape_64_cast_fp16)[name = tensor("reduce_mean_48_cast_fp16")]; tensor sub_32_cast_fp16 = sub(x = reshape_64_cast_fp16, y = reduce_mean_48_cast_fp16)[name = tensor("sub_32_cast_fp16")]; tensor square_16_cast_fp16 = square(x = sub_32_cast_fp16)[name = tensor("square_16_cast_fp16")]; tensor reduce_mean_50_axes_0 = const()[name = tensor("reduce_mean_50_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_50_keep_dims_0 = const()[name = tensor("reduce_mean_50_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_50_cast_fp16 = reduce_mean(axes = reduce_mean_50_axes_0, keep_dims = reduce_mean_50_keep_dims_0, x = square_16_cast_fp16)[name = tensor("reduce_mean_50_cast_fp16")]; tensor add_32_y_0_to_fp16 = const()[name = tensor("add_32_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_32_cast_fp16 = add(x = reduce_mean_50_cast_fp16, y = add_32_y_0_to_fp16)[name = tensor("add_32_cast_fp16")]; tensor sqrt_16_cast_fp16 = sqrt(x = add_32_cast_fp16)[name = tensor("sqrt_16_cast_fp16")]; tensor real_div_16_cast_fp16 = real_div(x = sub_32_cast_fp16, y = sqrt_16_cast_fp16)[name = tensor("real_div_16_cast_fp16")]; tensor reshape_65_shape_0 = const()[name = tensor("reshape_65_shape_0"), val = tensor([2, 1280, 12, 12])]; tensor reshape_65_cast_fp16 = reshape(shape = reshape_65_shape_0, x = real_div_16_cast_fp16)[name = tensor("reshape_65_cast_fp16")]; tensor add_33_gamma_0_to_fp16 = const()[name = tensor("add_33_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253580352)))]; tensor add_33_beta_0_to_fp16 = const()[name = tensor("add_33_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253582976)))]; tensor add_33_epsilon_0_to_fp16 = const()[name = tensor("add_33_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_33_cast_fp16 = batch_norm(beta = add_33_beta_0_to_fp16, epsilon = add_33_epsilon_0_to_fp16, gamma = add_33_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_65_cast_fp16)[name = tensor("add_33_cast_fp16")]; tensor input_155_cast_fp16 = silu(x = add_33_cast_fp16)[name = tensor("input_155_cast_fp16")]; tensor var_3287 = const()[name = tensor("op_3287"), val = tensor([1, 1])]; tensor var_3289 = const()[name = tensor("op_3289"), val = tensor([1, 1])]; tensor hidden_states_93_pad_type_0 = const()[name = tensor("hidden_states_93_pad_type_0"), val = tensor("custom")]; tensor hidden_states_93_pad_0 = const()[name = tensor("hidden_states_93_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_2_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253585600)))]; tensor down_blocks_2_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_2_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(283076864)))]; tensor hidden_states_93_cast_fp16 = conv(bias = down_blocks_2_resnets_1_conv2_bias_to_fp16, dilations = var_3289, groups = var_2254, pad = hidden_states_93_pad_0, pad_type = hidden_states_93_pad_type_0, strides = var_3287, weight = down_blocks_2_resnets_1_conv2_weight_to_fp16, x = input_155_cast_fp16)[name = tensor("hidden_states_93_cast_fp16")]; tensor hidden_states_95_cast_fp16 = add(x = input_143_cast_fp16_1, y = hidden_states_93_cast_fp16)[name = tensor("hidden_states_95_cast_fp16")]; tensor reshape_68_shape_0 = const()[name = tensor("reshape_68_shape_0"), val = tensor([2, 32, 40, 12, 12])]; tensor reshape_68_cast_fp16 = reshape(shape = reshape_68_shape_0, x = hidden_states_95_cast_fp16)[name = tensor("reshape_68_cast_fp16")]; tensor reduce_mean_51_axes_0 = const()[name = tensor("reduce_mean_51_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_51_keep_dims_0 = const()[name = tensor("reduce_mean_51_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_51_cast_fp16 = reduce_mean(axes = reduce_mean_51_axes_0, keep_dims = reduce_mean_51_keep_dims_0, x = reshape_68_cast_fp16)[name = tensor("reduce_mean_51_cast_fp16")]; tensor sub_34_cast_fp16 = sub(x = reshape_68_cast_fp16, y = reduce_mean_51_cast_fp16)[name = tensor("sub_34_cast_fp16")]; tensor square_17_cast_fp16 = square(x = sub_34_cast_fp16)[name = tensor("square_17_cast_fp16")]; tensor reduce_mean_53_axes_0 = const()[name = tensor("reduce_mean_53_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_53_keep_dims_0 = const()[name = tensor("reduce_mean_53_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_53_cast_fp16 = reduce_mean(axes = reduce_mean_53_axes_0, keep_dims = reduce_mean_53_keep_dims_0, x = square_17_cast_fp16)[name = tensor("reduce_mean_53_cast_fp16")]; tensor add_34_y_0_to_fp16 = const()[name = tensor("add_34_y_0_to_fp16"), val = tensor(0x1.1p-20)]; tensor add_34_cast_fp16 = add(x = reduce_mean_53_cast_fp16, y = add_34_y_0_to_fp16)[name = tensor("add_34_cast_fp16")]; tensor sqrt_17_cast_fp16 = sqrt(x = add_34_cast_fp16)[name = tensor("sqrt_17_cast_fp16")]; tensor real_div_17_cast_fp16 = real_div(x = sub_34_cast_fp16, y = sqrt_17_cast_fp16)[name = tensor("real_div_17_cast_fp16")]; tensor reshape_69_shape_0 = const()[name = tensor("reshape_69_shape_0"), val = tensor([2, 1280, 12, 12])]; tensor reshape_69_cast_fp16 = reshape(shape = reshape_69_shape_0, x = real_div_17_cast_fp16)[name = tensor("reshape_69_cast_fp16")]; tensor add_35_gamma_0_to_fp16 = const()[name = tensor("add_35_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(283079488)))]; tensor add_35_beta_0_to_fp16 = const()[name = tensor("add_35_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(283082112)))]; tensor add_35_epsilon_0_to_fp16 = const()[name = tensor("add_35_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_35_cast_fp16 = batch_norm(beta = add_35_beta_0_to_fp16, epsilon = add_35_epsilon_0_to_fp16, gamma = add_35_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_69_cast_fp16)[name = tensor("add_35_cast_fp16")]; tensor var_3309 = const()[name = tensor("op_3309"), val = tensor([1, 1])]; tensor var_3311 = const()[name = tensor("op_3311"), val = tensor([1, 1])]; tensor hidden_states_97_pad_type_0 = const()[name = tensor("hidden_states_97_pad_type_0"), val = tensor("custom")]; tensor hidden_states_97_pad_0 = const()[name = tensor("hidden_states_97_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_proj_in_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(283084736)))]; tensor down_blocks_2_attentions_1_proj_in_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286361600)))]; tensor hidden_states_97_cast_fp16 = conv(bias = down_blocks_2_attentions_1_proj_in_bias_to_fp16, dilations = var_3311, groups = var_2254, pad = hidden_states_97_pad_0, pad_type = hidden_states_97_pad_type_0, strides = var_3309, weight = down_blocks_2_attentions_1_proj_in_weight_to_fp16, x = add_35_cast_fp16)[name = tensor("hidden_states_97_cast_fp16")]; tensor var_3316 = const()[name = tensor("op_3316"), val = tensor([2, 1280, 1, 144])]; tensor inputs_31_cast_fp16 = reshape(shape = var_3316, x = hidden_states_97_cast_fp16)[name = tensor("inputs_31_cast_fp16")]; tensor var_3326 = const()[name = tensor("op_3326"), val = tensor([1])]; tensor channels_mean_31_cast_fp16 = reduce_mean(axes = var_3326, keep_dims = var_2249, x = inputs_31_cast_fp16)[name = tensor("channels_mean_31_cast_fp16")]; tensor zero_mean_31_cast_fp16 = sub(x = inputs_31_cast_fp16, y = channels_mean_31_cast_fp16)[name = tensor("zero_mean_31_cast_fp16")]; tensor zero_mean_sq_31_cast_fp16 = mul(x = zero_mean_31_cast_fp16, y = zero_mean_31_cast_fp16)[name = tensor("zero_mean_sq_31_cast_fp16")]; tensor var_3330 = const()[name = tensor("op_3330"), val = tensor([1])]; tensor var_3331_cast_fp16 = reduce_mean(axes = var_3330, keep_dims = var_2249, x = zero_mean_sq_31_cast_fp16)[name = tensor("op_3331_cast_fp16")]; tensor var_3332_to_fp16 = const()[name = tensor("op_3332_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3333_cast_fp16 = add(x = var_3331_cast_fp16, y = var_3332_to_fp16)[name = tensor("op_3333_cast_fp16")]; tensor denom_31_epsilon_0_to_fp16 = const()[name = tensor("denom_31_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_31_cast_fp16 = rsqrt(epsilon = denom_31_epsilon_0_to_fp16, x = var_3333_cast_fp16)[name = tensor("denom_31_cast_fp16")]; tensor out_31_cast_fp16 = mul(x = zero_mean_31_cast_fp16, y = denom_31_cast_fp16)[name = tensor("out_31_cast_fp16")]; tensor var_3337_to_fp16 = const()[name = tensor("op_3337_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286364224)))]; tensor var_3338_cast_fp16 = add(x = out_31_cast_fp16, y = var_3337_to_fp16)[name = tensor("op_3338_cast_fp16")]; tensor var_3340_to_fp16 = const()[name = tensor("op_3340_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286366848)))]; tensor hidden_states_99_cast_fp16 = mul(x = var_3338_cast_fp16, y = var_3340_to_fp16)[name = tensor("hidden_states_99_cast_fp16")]; tensor var_3347 = const()[name = tensor("op_3347"), val = tensor([1, 1])]; tensor var_3349 = const()[name = tensor("op_3349"), val = tensor([1, 1])]; tensor q_21_pad_type_0 = const()[name = tensor("q_21_pad_type_0"), val = tensor("custom")]; tensor q_21_pad_0 = const()[name = tensor("q_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286369472)))]; tensor q_21_cast_fp16 = conv(dilations = var_3349, groups = var_2254, pad = q_21_pad_0, pad_type = q_21_pad_type_0, strides = var_3347, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_99_cast_fp16)[name = tensor("q_21_cast_fp16")]; tensor var_3353 = const()[name = tensor("op_3353"), val = tensor([1, 1])]; tensor var_3355 = const()[name = tensor("op_3355"), val = tensor([1, 1])]; tensor k_41_pad_type_0 = const()[name = tensor("k_41_pad_type_0"), val = tensor("custom")]; tensor k_41_pad_0 = const()[name = tensor("k_41_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(289646336)))]; tensor k_41_cast_fp16 = conv(dilations = var_3355, groups = var_2254, pad = k_41_pad_0, pad_type = k_41_pad_type_0, strides = var_3353, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_99_cast_fp16)[name = tensor("k_41_cast_fp16")]; tensor var_3359 = const()[name = tensor("op_3359"), val = tensor([1, 1])]; tensor var_3361 = const()[name = tensor("op_3361"), val = tensor([1, 1])]; tensor v_21_pad_type_0 = const()[name = tensor("v_21_pad_type_0"), val = tensor("custom")]; tensor v_21_pad_0 = const()[name = tensor("v_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(292923200)))]; tensor v_21_cast_fp16 = conv(dilations = var_3361, groups = var_2254, pad = v_21_pad_0, pad_type = v_21_pad_type_0, strides = var_3359, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_99_cast_fp16)[name = tensor("v_21_cast_fp16")]; tensor var_3365_begin_0 = const()[name = tensor("op_3365_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_3365_end_0 = const()[name = tensor("op_3365_end_0"), val = tensor([2, 64, 1, 144])]; tensor var_3365_end_mask_0 = const()[name = tensor("op_3365_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3365_cast_fp16 = slice_by_index(begin = var_3365_begin_0, end = var_3365_end_0, end_mask = var_3365_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3365_cast_fp16")]; tensor var_3369_begin_0 = const()[name = tensor("op_3369_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_3369_end_0 = const()[name = tensor("op_3369_end_0"), val = tensor([2, 128, 1, 144])]; tensor var_3369_end_mask_0 = const()[name = tensor("op_3369_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3369_cast_fp16 = slice_by_index(begin = var_3369_begin_0, end = var_3369_end_0, end_mask = var_3369_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3369_cast_fp16")]; tensor var_3373_begin_0 = const()[name = tensor("op_3373_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_3373_end_0 = const()[name = tensor("op_3373_end_0"), val = tensor([2, 192, 1, 144])]; tensor var_3373_end_mask_0 = const()[name = tensor("op_3373_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3373_cast_fp16 = slice_by_index(begin = var_3373_begin_0, end = var_3373_end_0, end_mask = var_3373_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3373_cast_fp16")]; tensor var_3377_begin_0 = const()[name = tensor("op_3377_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_3377_end_0 = const()[name = tensor("op_3377_end_0"), val = tensor([2, 256, 1, 144])]; tensor var_3377_end_mask_0 = const()[name = tensor("op_3377_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3377_cast_fp16 = slice_by_index(begin = var_3377_begin_0, end = var_3377_end_0, end_mask = var_3377_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3377_cast_fp16")]; tensor var_3381_begin_0 = const()[name = tensor("op_3381_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_3381_end_0 = const()[name = tensor("op_3381_end_0"), val = tensor([2, 320, 1, 144])]; tensor var_3381_end_mask_0 = const()[name = tensor("op_3381_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3381_cast_fp16 = slice_by_index(begin = var_3381_begin_0, end = var_3381_end_0, end_mask = var_3381_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3381_cast_fp16")]; tensor var_3385_begin_0 = const()[name = tensor("op_3385_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_3385_end_0 = const()[name = tensor("op_3385_end_0"), val = tensor([2, 384, 1, 144])]; tensor var_3385_end_mask_0 = const()[name = tensor("op_3385_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3385_cast_fp16 = slice_by_index(begin = var_3385_begin_0, end = var_3385_end_0, end_mask = var_3385_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3385_cast_fp16")]; tensor var_3389_begin_0 = const()[name = tensor("op_3389_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_3389_end_0 = const()[name = tensor("op_3389_end_0"), val = tensor([2, 448, 1, 144])]; tensor var_3389_end_mask_0 = const()[name = tensor("op_3389_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3389_cast_fp16 = slice_by_index(begin = var_3389_begin_0, end = var_3389_end_0, end_mask = var_3389_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3389_cast_fp16")]; tensor var_3393_begin_0 = const()[name = tensor("op_3393_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_3393_end_0 = const()[name = tensor("op_3393_end_0"), val = tensor([2, 512, 1, 144])]; tensor var_3393_end_mask_0 = const()[name = tensor("op_3393_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3393_cast_fp16 = slice_by_index(begin = var_3393_begin_0, end = var_3393_end_0, end_mask = var_3393_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3393_cast_fp16")]; tensor var_3397_begin_0 = const()[name = tensor("op_3397_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_3397_end_0 = const()[name = tensor("op_3397_end_0"), val = tensor([2, 576, 1, 144])]; tensor var_3397_end_mask_0 = const()[name = tensor("op_3397_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3397_cast_fp16 = slice_by_index(begin = var_3397_begin_0, end = var_3397_end_0, end_mask = var_3397_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3397_cast_fp16")]; tensor var_3401_begin_0 = const()[name = tensor("op_3401_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_3401_end_0 = const()[name = tensor("op_3401_end_0"), val = tensor([2, 640, 1, 144])]; tensor var_3401_end_mask_0 = const()[name = tensor("op_3401_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3401_cast_fp16 = slice_by_index(begin = var_3401_begin_0, end = var_3401_end_0, end_mask = var_3401_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3401_cast_fp16")]; tensor var_3405_begin_0 = const()[name = tensor("op_3405_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_3405_end_0 = const()[name = tensor("op_3405_end_0"), val = tensor([2, 704, 1, 144])]; tensor var_3405_end_mask_0 = const()[name = tensor("op_3405_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3405_cast_fp16 = slice_by_index(begin = var_3405_begin_0, end = var_3405_end_0, end_mask = var_3405_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3405_cast_fp16")]; tensor var_3409_begin_0 = const()[name = tensor("op_3409_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_3409_end_0 = const()[name = tensor("op_3409_end_0"), val = tensor([2, 768, 1, 144])]; tensor var_3409_end_mask_0 = const()[name = tensor("op_3409_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3409_cast_fp16 = slice_by_index(begin = var_3409_begin_0, end = var_3409_end_0, end_mask = var_3409_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3409_cast_fp16")]; tensor var_3413_begin_0 = const()[name = tensor("op_3413_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_3413_end_0 = const()[name = tensor("op_3413_end_0"), val = tensor([2, 832, 1, 144])]; tensor var_3413_end_mask_0 = const()[name = tensor("op_3413_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3413_cast_fp16 = slice_by_index(begin = var_3413_begin_0, end = var_3413_end_0, end_mask = var_3413_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3413_cast_fp16")]; tensor var_3417_begin_0 = const()[name = tensor("op_3417_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_3417_end_0 = const()[name = tensor("op_3417_end_0"), val = tensor([2, 896, 1, 144])]; tensor var_3417_end_mask_0 = const()[name = tensor("op_3417_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3417_cast_fp16 = slice_by_index(begin = var_3417_begin_0, end = var_3417_end_0, end_mask = var_3417_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3417_cast_fp16")]; tensor var_3421_begin_0 = const()[name = tensor("op_3421_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_3421_end_0 = const()[name = tensor("op_3421_end_0"), val = tensor([2, 960, 1, 144])]; tensor var_3421_end_mask_0 = const()[name = tensor("op_3421_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3421_cast_fp16 = slice_by_index(begin = var_3421_begin_0, end = var_3421_end_0, end_mask = var_3421_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3421_cast_fp16")]; tensor var_3425_begin_0 = const()[name = tensor("op_3425_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_3425_end_0 = const()[name = tensor("op_3425_end_0"), val = tensor([2, 1024, 1, 144])]; tensor var_3425_end_mask_0 = const()[name = tensor("op_3425_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3425_cast_fp16 = slice_by_index(begin = var_3425_begin_0, end = var_3425_end_0, end_mask = var_3425_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3425_cast_fp16")]; tensor var_3429_begin_0 = const()[name = tensor("op_3429_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_3429_end_0 = const()[name = tensor("op_3429_end_0"), val = tensor([2, 1088, 1, 144])]; tensor var_3429_end_mask_0 = const()[name = tensor("op_3429_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3429_cast_fp16 = slice_by_index(begin = var_3429_begin_0, end = var_3429_end_0, end_mask = var_3429_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3429_cast_fp16")]; tensor var_3433_begin_0 = const()[name = tensor("op_3433_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_3433_end_0 = const()[name = tensor("op_3433_end_0"), val = tensor([2, 1152, 1, 144])]; tensor var_3433_end_mask_0 = const()[name = tensor("op_3433_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3433_cast_fp16 = slice_by_index(begin = var_3433_begin_0, end = var_3433_end_0, end_mask = var_3433_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3433_cast_fp16")]; tensor var_3437_begin_0 = const()[name = tensor("op_3437_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_3437_end_0 = const()[name = tensor("op_3437_end_0"), val = tensor([2, 1216, 1, 144])]; tensor var_3437_end_mask_0 = const()[name = tensor("op_3437_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3437_cast_fp16 = slice_by_index(begin = var_3437_begin_0, end = var_3437_end_0, end_mask = var_3437_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3437_cast_fp16")]; tensor var_3441_begin_0 = const()[name = tensor("op_3441_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_3441_end_0 = const()[name = tensor("op_3441_end_0"), val = tensor([2, 1280, 1, 144])]; tensor var_3441_end_mask_0 = const()[name = tensor("op_3441_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3441_cast_fp16 = slice_by_index(begin = var_3441_begin_0, end = var_3441_end_0, end_mask = var_3441_end_mask_0, x = q_21_cast_fp16)[name = tensor("op_3441_cast_fp16")]; tensor k_43_perm_0 = const()[name = tensor("k_43_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_3448_begin_0 = const()[name = tensor("op_3448_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_3448_end_0 = const()[name = tensor("op_3448_end_0"), val = tensor([2, 144, 1, 64])]; tensor var_3448_end_mask_0 = const()[name = tensor("op_3448_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_3 = transpose(perm = k_43_perm_0, x = k_41_cast_fp16)[name = tensor("transpose_3")]; tensor var_3448_cast_fp16 = slice_by_index(begin = var_3448_begin_0, end = var_3448_end_0, end_mask = var_3448_end_mask_0, x = transpose_3)[name = tensor("op_3448_cast_fp16")]; tensor var_3452_begin_0 = const()[name = tensor("op_3452_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_3452_end_0 = const()[name = tensor("op_3452_end_0"), val = tensor([2, 144, 1, 128])]; tensor var_3452_end_mask_0 = const()[name = tensor("op_3452_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3452_cast_fp16 = slice_by_index(begin = var_3452_begin_0, end = var_3452_end_0, end_mask = var_3452_end_mask_0, x = transpose_3)[name = tensor("op_3452_cast_fp16")]; tensor var_3456_begin_0 = const()[name = tensor("op_3456_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_3456_end_0 = const()[name = tensor("op_3456_end_0"), val = tensor([2, 144, 1, 192])]; tensor var_3456_end_mask_0 = const()[name = tensor("op_3456_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3456_cast_fp16 = slice_by_index(begin = var_3456_begin_0, end = var_3456_end_0, end_mask = var_3456_end_mask_0, x = transpose_3)[name = tensor("op_3456_cast_fp16")]; tensor var_3460_begin_0 = const()[name = tensor("op_3460_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_3460_end_0 = const()[name = tensor("op_3460_end_0"), val = tensor([2, 144, 1, 256])]; tensor var_3460_end_mask_0 = const()[name = tensor("op_3460_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3460_cast_fp16 = slice_by_index(begin = var_3460_begin_0, end = var_3460_end_0, end_mask = var_3460_end_mask_0, x = transpose_3)[name = tensor("op_3460_cast_fp16")]; tensor var_3464_begin_0 = const()[name = tensor("op_3464_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_3464_end_0 = const()[name = tensor("op_3464_end_0"), val = tensor([2, 144, 1, 320])]; tensor var_3464_end_mask_0 = const()[name = tensor("op_3464_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3464_cast_fp16 = slice_by_index(begin = var_3464_begin_0, end = var_3464_end_0, end_mask = var_3464_end_mask_0, x = transpose_3)[name = tensor("op_3464_cast_fp16")]; tensor var_3468_begin_0 = const()[name = tensor("op_3468_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_3468_end_0 = const()[name = tensor("op_3468_end_0"), val = tensor([2, 144, 1, 384])]; tensor var_3468_end_mask_0 = const()[name = tensor("op_3468_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3468_cast_fp16 = slice_by_index(begin = var_3468_begin_0, end = var_3468_end_0, end_mask = var_3468_end_mask_0, x = transpose_3)[name = tensor("op_3468_cast_fp16")]; tensor var_3472_begin_0 = const()[name = tensor("op_3472_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_3472_end_0 = const()[name = tensor("op_3472_end_0"), val = tensor([2, 144, 1, 448])]; tensor var_3472_end_mask_0 = const()[name = tensor("op_3472_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3472_cast_fp16 = slice_by_index(begin = var_3472_begin_0, end = var_3472_end_0, end_mask = var_3472_end_mask_0, x = transpose_3)[name = tensor("op_3472_cast_fp16")]; tensor var_3476_begin_0 = const()[name = tensor("op_3476_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_3476_end_0 = const()[name = tensor("op_3476_end_0"), val = tensor([2, 144, 1, 512])]; tensor var_3476_end_mask_0 = const()[name = tensor("op_3476_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3476_cast_fp16 = slice_by_index(begin = var_3476_begin_0, end = var_3476_end_0, end_mask = var_3476_end_mask_0, x = transpose_3)[name = tensor("op_3476_cast_fp16")]; tensor var_3480_begin_0 = const()[name = tensor("op_3480_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_3480_end_0 = const()[name = tensor("op_3480_end_0"), val = tensor([2, 144, 1, 576])]; tensor var_3480_end_mask_0 = const()[name = tensor("op_3480_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3480_cast_fp16 = slice_by_index(begin = var_3480_begin_0, end = var_3480_end_0, end_mask = var_3480_end_mask_0, x = transpose_3)[name = tensor("op_3480_cast_fp16")]; tensor var_3484_begin_0 = const()[name = tensor("op_3484_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_3484_end_0 = const()[name = tensor("op_3484_end_0"), val = tensor([2, 144, 1, 640])]; tensor var_3484_end_mask_0 = const()[name = tensor("op_3484_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3484_cast_fp16 = slice_by_index(begin = var_3484_begin_0, end = var_3484_end_0, end_mask = var_3484_end_mask_0, x = transpose_3)[name = tensor("op_3484_cast_fp16")]; tensor var_3488_begin_0 = const()[name = tensor("op_3488_begin_0"), val = tensor([0, 0, 0, 640])]; tensor var_3488_end_0 = const()[name = tensor("op_3488_end_0"), val = tensor([2, 144, 1, 704])]; tensor var_3488_end_mask_0 = const()[name = tensor("op_3488_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3488_cast_fp16 = slice_by_index(begin = var_3488_begin_0, end = var_3488_end_0, end_mask = var_3488_end_mask_0, x = transpose_3)[name = tensor("op_3488_cast_fp16")]; tensor var_3492_begin_0 = const()[name = tensor("op_3492_begin_0"), val = tensor([0, 0, 0, 704])]; tensor var_3492_end_0 = const()[name = tensor("op_3492_end_0"), val = tensor([2, 144, 1, 768])]; tensor var_3492_end_mask_0 = const()[name = tensor("op_3492_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3492_cast_fp16 = slice_by_index(begin = var_3492_begin_0, end = var_3492_end_0, end_mask = var_3492_end_mask_0, x = transpose_3)[name = tensor("op_3492_cast_fp16")]; tensor var_3496_begin_0 = const()[name = tensor("op_3496_begin_0"), val = tensor([0, 0, 0, 768])]; tensor var_3496_end_0 = const()[name = tensor("op_3496_end_0"), val = tensor([2, 144, 1, 832])]; tensor var_3496_end_mask_0 = const()[name = tensor("op_3496_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3496_cast_fp16 = slice_by_index(begin = var_3496_begin_0, end = var_3496_end_0, end_mask = var_3496_end_mask_0, x = transpose_3)[name = tensor("op_3496_cast_fp16")]; tensor var_3500_begin_0 = const()[name = tensor("op_3500_begin_0"), val = tensor([0, 0, 0, 832])]; tensor var_3500_end_0 = const()[name = tensor("op_3500_end_0"), val = tensor([2, 144, 1, 896])]; tensor var_3500_end_mask_0 = const()[name = tensor("op_3500_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3500_cast_fp16 = slice_by_index(begin = var_3500_begin_0, end = var_3500_end_0, end_mask = var_3500_end_mask_0, x = transpose_3)[name = tensor("op_3500_cast_fp16")]; tensor var_3504_begin_0 = const()[name = tensor("op_3504_begin_0"), val = tensor([0, 0, 0, 896])]; tensor var_3504_end_0 = const()[name = tensor("op_3504_end_0"), val = tensor([2, 144, 1, 960])]; tensor var_3504_end_mask_0 = const()[name = tensor("op_3504_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3504_cast_fp16 = slice_by_index(begin = var_3504_begin_0, end = var_3504_end_0, end_mask = var_3504_end_mask_0, x = transpose_3)[name = tensor("op_3504_cast_fp16")]; tensor var_3508_begin_0 = const()[name = tensor("op_3508_begin_0"), val = tensor([0, 0, 0, 960])]; tensor var_3508_end_0 = const()[name = tensor("op_3508_end_0"), val = tensor([2, 144, 1, 1024])]; tensor var_3508_end_mask_0 = const()[name = tensor("op_3508_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3508_cast_fp16 = slice_by_index(begin = var_3508_begin_0, end = var_3508_end_0, end_mask = var_3508_end_mask_0, x = transpose_3)[name = tensor("op_3508_cast_fp16")]; tensor var_3512_begin_0 = const()[name = tensor("op_3512_begin_0"), val = tensor([0, 0, 0, 1024])]; tensor var_3512_end_0 = const()[name = tensor("op_3512_end_0"), val = tensor([2, 144, 1, 1088])]; tensor var_3512_end_mask_0 = const()[name = tensor("op_3512_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3512_cast_fp16 = slice_by_index(begin = var_3512_begin_0, end = var_3512_end_0, end_mask = var_3512_end_mask_0, x = transpose_3)[name = tensor("op_3512_cast_fp16")]; tensor var_3516_begin_0 = const()[name = tensor("op_3516_begin_0"), val = tensor([0, 0, 0, 1088])]; tensor var_3516_end_0 = const()[name = tensor("op_3516_end_0"), val = tensor([2, 144, 1, 1152])]; tensor var_3516_end_mask_0 = const()[name = tensor("op_3516_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3516_cast_fp16 = slice_by_index(begin = var_3516_begin_0, end = var_3516_end_0, end_mask = var_3516_end_mask_0, x = transpose_3)[name = tensor("op_3516_cast_fp16")]; tensor var_3520_begin_0 = const()[name = tensor("op_3520_begin_0"), val = tensor([0, 0, 0, 1152])]; tensor var_3520_end_0 = const()[name = tensor("op_3520_end_0"), val = tensor([2, 144, 1, 1216])]; tensor var_3520_end_mask_0 = const()[name = tensor("op_3520_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3520_cast_fp16 = slice_by_index(begin = var_3520_begin_0, end = var_3520_end_0, end_mask = var_3520_end_mask_0, x = transpose_3)[name = tensor("op_3520_cast_fp16")]; tensor var_3524_begin_0 = const()[name = tensor("op_3524_begin_0"), val = tensor([0, 0, 0, 1216])]; tensor var_3524_end_0 = const()[name = tensor("op_3524_end_0"), val = tensor([2, 144, 1, 1280])]; tensor var_3524_end_mask_0 = const()[name = tensor("op_3524_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3524_cast_fp16 = slice_by_index(begin = var_3524_begin_0, end = var_3524_end_0, end_mask = var_3524_end_mask_0, x = transpose_3)[name = tensor("op_3524_cast_fp16")]; tensor var_3526_begin_0 = const()[name = tensor("op_3526_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_3526_end_0 = const()[name = tensor("op_3526_end_0"), val = tensor([2, 64, 1, 144])]; tensor var_3526_end_mask_0 = const()[name = tensor("op_3526_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3526_cast_fp16 = slice_by_index(begin = var_3526_begin_0, end = var_3526_end_0, end_mask = var_3526_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3526_cast_fp16")]; tensor var_3530_begin_0 = const()[name = tensor("op_3530_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_3530_end_0 = const()[name = tensor("op_3530_end_0"), val = tensor([2, 128, 1, 144])]; tensor var_3530_end_mask_0 = const()[name = tensor("op_3530_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3530_cast_fp16 = slice_by_index(begin = var_3530_begin_0, end = var_3530_end_0, end_mask = var_3530_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3530_cast_fp16")]; tensor var_3534_begin_0 = const()[name = tensor("op_3534_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_3534_end_0 = const()[name = tensor("op_3534_end_0"), val = tensor([2, 192, 1, 144])]; tensor var_3534_end_mask_0 = const()[name = tensor("op_3534_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3534_cast_fp16 = slice_by_index(begin = var_3534_begin_0, end = var_3534_end_0, end_mask = var_3534_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3534_cast_fp16")]; tensor var_3538_begin_0 = const()[name = tensor("op_3538_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_3538_end_0 = const()[name = tensor("op_3538_end_0"), val = tensor([2, 256, 1, 144])]; tensor var_3538_end_mask_0 = const()[name = tensor("op_3538_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3538_cast_fp16 = slice_by_index(begin = var_3538_begin_0, end = var_3538_end_0, end_mask = var_3538_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3538_cast_fp16")]; tensor var_3542_begin_0 = const()[name = tensor("op_3542_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_3542_end_0 = const()[name = tensor("op_3542_end_0"), val = tensor([2, 320, 1, 144])]; tensor var_3542_end_mask_0 = const()[name = tensor("op_3542_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3542_cast_fp16 = slice_by_index(begin = var_3542_begin_0, end = var_3542_end_0, end_mask = var_3542_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3542_cast_fp16")]; tensor var_3546_begin_0 = const()[name = tensor("op_3546_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_3546_end_0 = const()[name = tensor("op_3546_end_0"), val = tensor([2, 384, 1, 144])]; tensor var_3546_end_mask_0 = const()[name = tensor("op_3546_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3546_cast_fp16 = slice_by_index(begin = var_3546_begin_0, end = var_3546_end_0, end_mask = var_3546_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3546_cast_fp16")]; tensor var_3550_begin_0 = const()[name = tensor("op_3550_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_3550_end_0 = const()[name = tensor("op_3550_end_0"), val = tensor([2, 448, 1, 144])]; tensor var_3550_end_mask_0 = const()[name = tensor("op_3550_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3550_cast_fp16 = slice_by_index(begin = var_3550_begin_0, end = var_3550_end_0, end_mask = var_3550_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3550_cast_fp16")]; tensor var_3554_begin_0 = const()[name = tensor("op_3554_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_3554_end_0 = const()[name = tensor("op_3554_end_0"), val = tensor([2, 512, 1, 144])]; tensor var_3554_end_mask_0 = const()[name = tensor("op_3554_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3554_cast_fp16 = slice_by_index(begin = var_3554_begin_0, end = var_3554_end_0, end_mask = var_3554_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3554_cast_fp16")]; tensor var_3558_begin_0 = const()[name = tensor("op_3558_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_3558_end_0 = const()[name = tensor("op_3558_end_0"), val = tensor([2, 576, 1, 144])]; tensor var_3558_end_mask_0 = const()[name = tensor("op_3558_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3558_cast_fp16 = slice_by_index(begin = var_3558_begin_0, end = var_3558_end_0, end_mask = var_3558_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3558_cast_fp16")]; tensor var_3562_begin_0 = const()[name = tensor("op_3562_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_3562_end_0 = const()[name = tensor("op_3562_end_0"), val = tensor([2, 640, 1, 144])]; tensor var_3562_end_mask_0 = const()[name = tensor("op_3562_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3562_cast_fp16 = slice_by_index(begin = var_3562_begin_0, end = var_3562_end_0, end_mask = var_3562_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3562_cast_fp16")]; tensor var_3566_begin_0 = const()[name = tensor("op_3566_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_3566_end_0 = const()[name = tensor("op_3566_end_0"), val = tensor([2, 704, 1, 144])]; tensor var_3566_end_mask_0 = const()[name = tensor("op_3566_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3566_cast_fp16 = slice_by_index(begin = var_3566_begin_0, end = var_3566_end_0, end_mask = var_3566_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3566_cast_fp16")]; tensor var_3570_begin_0 = const()[name = tensor("op_3570_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_3570_end_0 = const()[name = tensor("op_3570_end_0"), val = tensor([2, 768, 1, 144])]; tensor var_3570_end_mask_0 = const()[name = tensor("op_3570_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3570_cast_fp16 = slice_by_index(begin = var_3570_begin_0, end = var_3570_end_0, end_mask = var_3570_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3570_cast_fp16")]; tensor var_3574_begin_0 = const()[name = tensor("op_3574_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_3574_end_0 = const()[name = tensor("op_3574_end_0"), val = tensor([2, 832, 1, 144])]; tensor var_3574_end_mask_0 = const()[name = tensor("op_3574_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3574_cast_fp16 = slice_by_index(begin = var_3574_begin_0, end = var_3574_end_0, end_mask = var_3574_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3574_cast_fp16")]; tensor var_3578_begin_0 = const()[name = tensor("op_3578_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_3578_end_0 = const()[name = tensor("op_3578_end_0"), val = tensor([2, 896, 1, 144])]; tensor var_3578_end_mask_0 = const()[name = tensor("op_3578_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3578_cast_fp16 = slice_by_index(begin = var_3578_begin_0, end = var_3578_end_0, end_mask = var_3578_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3578_cast_fp16")]; tensor var_3582_begin_0 = const()[name = tensor("op_3582_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_3582_end_0 = const()[name = tensor("op_3582_end_0"), val = tensor([2, 960, 1, 144])]; tensor var_3582_end_mask_0 = const()[name = tensor("op_3582_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3582_cast_fp16 = slice_by_index(begin = var_3582_begin_0, end = var_3582_end_0, end_mask = var_3582_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3582_cast_fp16")]; tensor var_3586_begin_0 = const()[name = tensor("op_3586_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_3586_end_0 = const()[name = tensor("op_3586_end_0"), val = tensor([2, 1024, 1, 144])]; tensor var_3586_end_mask_0 = const()[name = tensor("op_3586_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3586_cast_fp16 = slice_by_index(begin = var_3586_begin_0, end = var_3586_end_0, end_mask = var_3586_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3586_cast_fp16")]; tensor var_3590_begin_0 = const()[name = tensor("op_3590_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_3590_end_0 = const()[name = tensor("op_3590_end_0"), val = tensor([2, 1088, 1, 144])]; tensor var_3590_end_mask_0 = const()[name = tensor("op_3590_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3590_cast_fp16 = slice_by_index(begin = var_3590_begin_0, end = var_3590_end_0, end_mask = var_3590_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3590_cast_fp16")]; tensor var_3594_begin_0 = const()[name = tensor("op_3594_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_3594_end_0 = const()[name = tensor("op_3594_end_0"), val = tensor([2, 1152, 1, 144])]; tensor var_3594_end_mask_0 = const()[name = tensor("op_3594_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3594_cast_fp16 = slice_by_index(begin = var_3594_begin_0, end = var_3594_end_0, end_mask = var_3594_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3594_cast_fp16")]; tensor var_3598_begin_0 = const()[name = tensor("op_3598_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_3598_end_0 = const()[name = tensor("op_3598_end_0"), val = tensor([2, 1216, 1, 144])]; tensor var_3598_end_mask_0 = const()[name = tensor("op_3598_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3598_cast_fp16 = slice_by_index(begin = var_3598_begin_0, end = var_3598_end_0, end_mask = var_3598_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3598_cast_fp16")]; tensor var_3602_begin_0 = const()[name = tensor("op_3602_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_3602_end_0 = const()[name = tensor("op_3602_end_0"), val = tensor([2, 1280, 1, 144])]; tensor var_3602_end_mask_0 = const()[name = tensor("op_3602_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3602_cast_fp16 = slice_by_index(begin = var_3602_begin_0, end = var_3602_end_0, end_mask = var_3602_end_mask_0, x = v_21_cast_fp16)[name = tensor("op_3602_cast_fp16")]; tensor var_3606_equation_0 = const()[name = tensor("op_3606_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3606_cast_fp16 = einsum(equation = var_3606_equation_0, values = (var_3448_cast_fp16, var_3365_cast_fp16))[name = tensor("op_3606_cast_fp16")]; tensor var_3607_to_fp16 = const()[name = tensor("op_3607_to_fp16"), val = tensor(0x1p-3)]; tensor aw_201_cast_fp16 = mul(x = var_3606_cast_fp16, y = var_3607_to_fp16)[name = tensor("aw_201_cast_fp16")]; tensor var_3610_equation_0 = const()[name = tensor("op_3610_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3610_cast_fp16 = einsum(equation = var_3610_equation_0, values = (var_3452_cast_fp16, var_3369_cast_fp16))[name = tensor("op_3610_cast_fp16")]; tensor var_3611_to_fp16 = const()[name = tensor("op_3611_to_fp16"), val = tensor(0x1p-3)]; tensor aw_203_cast_fp16 = mul(x = var_3610_cast_fp16, y = var_3611_to_fp16)[name = tensor("aw_203_cast_fp16")]; tensor var_3614_equation_0 = const()[name = tensor("op_3614_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3614_cast_fp16 = einsum(equation = var_3614_equation_0, values = (var_3456_cast_fp16, var_3373_cast_fp16))[name = tensor("op_3614_cast_fp16")]; tensor var_3615_to_fp16 = const()[name = tensor("op_3615_to_fp16"), val = tensor(0x1p-3)]; tensor aw_205_cast_fp16 = mul(x = var_3614_cast_fp16, y = var_3615_to_fp16)[name = tensor("aw_205_cast_fp16")]; tensor var_3618_equation_0 = const()[name = tensor("op_3618_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3618_cast_fp16 = einsum(equation = var_3618_equation_0, values = (var_3460_cast_fp16, var_3377_cast_fp16))[name = tensor("op_3618_cast_fp16")]; tensor var_3619_to_fp16 = const()[name = tensor("op_3619_to_fp16"), val = tensor(0x1p-3)]; tensor aw_207_cast_fp16 = mul(x = var_3618_cast_fp16, y = var_3619_to_fp16)[name = tensor("aw_207_cast_fp16")]; tensor var_3622_equation_0 = const()[name = tensor("op_3622_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3622_cast_fp16 = einsum(equation = var_3622_equation_0, values = (var_3464_cast_fp16, var_3381_cast_fp16))[name = tensor("op_3622_cast_fp16")]; tensor var_3623_to_fp16 = const()[name = tensor("op_3623_to_fp16"), val = tensor(0x1p-3)]; tensor aw_209_cast_fp16 = mul(x = var_3622_cast_fp16, y = var_3623_to_fp16)[name = tensor("aw_209_cast_fp16")]; tensor var_3626_equation_0 = const()[name = tensor("op_3626_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3626_cast_fp16 = einsum(equation = var_3626_equation_0, values = (var_3468_cast_fp16, var_3385_cast_fp16))[name = tensor("op_3626_cast_fp16")]; tensor var_3627_to_fp16 = const()[name = tensor("op_3627_to_fp16"), val = tensor(0x1p-3)]; tensor aw_211_cast_fp16 = mul(x = var_3626_cast_fp16, y = var_3627_to_fp16)[name = tensor("aw_211_cast_fp16")]; tensor var_3630_equation_0 = const()[name = tensor("op_3630_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3630_cast_fp16 = einsum(equation = var_3630_equation_0, values = (var_3472_cast_fp16, var_3389_cast_fp16))[name = tensor("op_3630_cast_fp16")]; tensor var_3631_to_fp16 = const()[name = tensor("op_3631_to_fp16"), val = tensor(0x1p-3)]; tensor aw_213_cast_fp16 = mul(x = var_3630_cast_fp16, y = var_3631_to_fp16)[name = tensor("aw_213_cast_fp16")]; tensor var_3634_equation_0 = const()[name = tensor("op_3634_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3634_cast_fp16 = einsum(equation = var_3634_equation_0, values = (var_3476_cast_fp16, var_3393_cast_fp16))[name = tensor("op_3634_cast_fp16")]; tensor var_3635_to_fp16 = const()[name = tensor("op_3635_to_fp16"), val = tensor(0x1p-3)]; tensor aw_215_cast_fp16 = mul(x = var_3634_cast_fp16, y = var_3635_to_fp16)[name = tensor("aw_215_cast_fp16")]; tensor var_3638_equation_0 = const()[name = tensor("op_3638_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3638_cast_fp16 = einsum(equation = var_3638_equation_0, values = (var_3480_cast_fp16, var_3397_cast_fp16))[name = tensor("op_3638_cast_fp16")]; tensor var_3639_to_fp16 = const()[name = tensor("op_3639_to_fp16"), val = tensor(0x1p-3)]; tensor aw_217_cast_fp16 = mul(x = var_3638_cast_fp16, y = var_3639_to_fp16)[name = tensor("aw_217_cast_fp16")]; tensor var_3642_equation_0 = const()[name = tensor("op_3642_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3642_cast_fp16 = einsum(equation = var_3642_equation_0, values = (var_3484_cast_fp16, var_3401_cast_fp16))[name = tensor("op_3642_cast_fp16")]; tensor var_3643_to_fp16 = const()[name = tensor("op_3643_to_fp16"), val = tensor(0x1p-3)]; tensor aw_219_cast_fp16 = mul(x = var_3642_cast_fp16, y = var_3643_to_fp16)[name = tensor("aw_219_cast_fp16")]; tensor var_3646_equation_0 = const()[name = tensor("op_3646_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3646_cast_fp16 = einsum(equation = var_3646_equation_0, values = (var_3488_cast_fp16, var_3405_cast_fp16))[name = tensor("op_3646_cast_fp16")]; tensor var_3647_to_fp16 = const()[name = tensor("op_3647_to_fp16"), val = tensor(0x1p-3)]; tensor aw_221_cast_fp16 = mul(x = var_3646_cast_fp16, y = var_3647_to_fp16)[name = tensor("aw_221_cast_fp16")]; tensor var_3650_equation_0 = const()[name = tensor("op_3650_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3650_cast_fp16 = einsum(equation = var_3650_equation_0, values = (var_3492_cast_fp16, var_3409_cast_fp16))[name = tensor("op_3650_cast_fp16")]; tensor var_3651_to_fp16 = const()[name = tensor("op_3651_to_fp16"), val = tensor(0x1p-3)]; tensor aw_223_cast_fp16 = mul(x = var_3650_cast_fp16, y = var_3651_to_fp16)[name = tensor("aw_223_cast_fp16")]; tensor var_3654_equation_0 = const()[name = tensor("op_3654_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3654_cast_fp16 = einsum(equation = var_3654_equation_0, values = (var_3496_cast_fp16, var_3413_cast_fp16))[name = tensor("op_3654_cast_fp16")]; tensor var_3655_to_fp16 = const()[name = tensor("op_3655_to_fp16"), val = tensor(0x1p-3)]; tensor aw_225_cast_fp16 = mul(x = var_3654_cast_fp16, y = var_3655_to_fp16)[name = tensor("aw_225_cast_fp16")]; tensor var_3658_equation_0 = const()[name = tensor("op_3658_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3658_cast_fp16 = einsum(equation = var_3658_equation_0, values = (var_3500_cast_fp16, var_3417_cast_fp16))[name = tensor("op_3658_cast_fp16")]; tensor var_3659_to_fp16 = const()[name = tensor("op_3659_to_fp16"), val = tensor(0x1p-3)]; tensor aw_227_cast_fp16 = mul(x = var_3658_cast_fp16, y = var_3659_to_fp16)[name = tensor("aw_227_cast_fp16")]; tensor var_3662_equation_0 = const()[name = tensor("op_3662_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3662_cast_fp16 = einsum(equation = var_3662_equation_0, values = (var_3504_cast_fp16, var_3421_cast_fp16))[name = tensor("op_3662_cast_fp16")]; tensor var_3663_to_fp16 = const()[name = tensor("op_3663_to_fp16"), val = tensor(0x1p-3)]; tensor aw_229_cast_fp16 = mul(x = var_3662_cast_fp16, y = var_3663_to_fp16)[name = tensor("aw_229_cast_fp16")]; tensor var_3666_equation_0 = const()[name = tensor("op_3666_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3666_cast_fp16 = einsum(equation = var_3666_equation_0, values = (var_3508_cast_fp16, var_3425_cast_fp16))[name = tensor("op_3666_cast_fp16")]; tensor var_3667_to_fp16 = const()[name = tensor("op_3667_to_fp16"), val = tensor(0x1p-3)]; tensor aw_231_cast_fp16 = mul(x = var_3666_cast_fp16, y = var_3667_to_fp16)[name = tensor("aw_231_cast_fp16")]; tensor var_3670_equation_0 = const()[name = tensor("op_3670_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3670_cast_fp16 = einsum(equation = var_3670_equation_0, values = (var_3512_cast_fp16, var_3429_cast_fp16))[name = tensor("op_3670_cast_fp16")]; tensor var_3671_to_fp16 = const()[name = tensor("op_3671_to_fp16"), val = tensor(0x1p-3)]; tensor aw_233_cast_fp16 = mul(x = var_3670_cast_fp16, y = var_3671_to_fp16)[name = tensor("aw_233_cast_fp16")]; tensor var_3674_equation_0 = const()[name = tensor("op_3674_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3674_cast_fp16 = einsum(equation = var_3674_equation_0, values = (var_3516_cast_fp16, var_3433_cast_fp16))[name = tensor("op_3674_cast_fp16")]; tensor var_3675_to_fp16 = const()[name = tensor("op_3675_to_fp16"), val = tensor(0x1p-3)]; tensor aw_235_cast_fp16 = mul(x = var_3674_cast_fp16, y = var_3675_to_fp16)[name = tensor("aw_235_cast_fp16")]; tensor var_3678_equation_0 = const()[name = tensor("op_3678_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3678_cast_fp16 = einsum(equation = var_3678_equation_0, values = (var_3520_cast_fp16, var_3437_cast_fp16))[name = tensor("op_3678_cast_fp16")]; tensor var_3679_to_fp16 = const()[name = tensor("op_3679_to_fp16"), val = tensor(0x1p-3)]; tensor aw_237_cast_fp16 = mul(x = var_3678_cast_fp16, y = var_3679_to_fp16)[name = tensor("aw_237_cast_fp16")]; tensor var_3682_equation_0 = const()[name = tensor("op_3682_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_3682_cast_fp16 = einsum(equation = var_3682_equation_0, values = (var_3524_cast_fp16, var_3441_cast_fp16))[name = tensor("op_3682_cast_fp16")]; tensor var_3683_to_fp16 = const()[name = tensor("op_3683_to_fp16"), val = tensor(0x1p-3)]; tensor aw_239_cast_fp16 = mul(x = var_3682_cast_fp16, y = var_3683_to_fp16)[name = tensor("aw_239_cast_fp16")]; tensor var_3685_cast_fp16 = softmax(axis = var_2254, x = aw_201_cast_fp16)[name = tensor("op_3685_cast_fp16")]; tensor var_3686_cast_fp16 = softmax(axis = var_2254, x = aw_203_cast_fp16)[name = tensor("op_3686_cast_fp16")]; tensor var_3687_cast_fp16 = softmax(axis = var_2254, x = aw_205_cast_fp16)[name = tensor("op_3687_cast_fp16")]; tensor var_3688_cast_fp16 = softmax(axis = var_2254, x = aw_207_cast_fp16)[name = tensor("op_3688_cast_fp16")]; tensor var_3689_cast_fp16 = softmax(axis = var_2254, x = aw_209_cast_fp16)[name = tensor("op_3689_cast_fp16")]; tensor var_3690_cast_fp16 = softmax(axis = var_2254, x = aw_211_cast_fp16)[name = tensor("op_3690_cast_fp16")]; tensor var_3691_cast_fp16 = softmax(axis = var_2254, x = aw_213_cast_fp16)[name = tensor("op_3691_cast_fp16")]; tensor var_3692_cast_fp16 = softmax(axis = var_2254, x = aw_215_cast_fp16)[name = tensor("op_3692_cast_fp16")]; tensor var_3693_cast_fp16 = softmax(axis = var_2254, x = aw_217_cast_fp16)[name = tensor("op_3693_cast_fp16")]; tensor var_3694_cast_fp16 = softmax(axis = var_2254, x = aw_219_cast_fp16)[name = tensor("op_3694_cast_fp16")]; tensor var_3695_cast_fp16 = softmax(axis = var_2254, x = aw_221_cast_fp16)[name = tensor("op_3695_cast_fp16")]; tensor var_3696_cast_fp16 = softmax(axis = var_2254, x = aw_223_cast_fp16)[name = tensor("op_3696_cast_fp16")]; tensor var_3697_cast_fp16 = softmax(axis = var_2254, x = aw_225_cast_fp16)[name = tensor("op_3697_cast_fp16")]; tensor var_3698_cast_fp16 = softmax(axis = var_2254, x = aw_227_cast_fp16)[name = tensor("op_3698_cast_fp16")]; tensor var_3699_cast_fp16 = softmax(axis = var_2254, x = aw_229_cast_fp16)[name = tensor("op_3699_cast_fp16")]; tensor var_3700_cast_fp16 = softmax(axis = var_2254, x = aw_231_cast_fp16)[name = tensor("op_3700_cast_fp16")]; tensor var_3701_cast_fp16 = softmax(axis = var_2254, x = aw_233_cast_fp16)[name = tensor("op_3701_cast_fp16")]; tensor var_3702_cast_fp16 = softmax(axis = var_2254, x = aw_235_cast_fp16)[name = tensor("op_3702_cast_fp16")]; tensor var_3703_cast_fp16 = softmax(axis = var_2254, x = aw_237_cast_fp16)[name = tensor("op_3703_cast_fp16")]; tensor var_3704_cast_fp16 = softmax(axis = var_2254, x = aw_239_cast_fp16)[name = tensor("op_3704_cast_fp16")]; tensor var_3706_equation_0 = const()[name = tensor("op_3706_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3706_cast_fp16 = einsum(equation = var_3706_equation_0, values = (var_3526_cast_fp16, var_3685_cast_fp16))[name = tensor("op_3706_cast_fp16")]; tensor var_3708_equation_0 = const()[name = tensor("op_3708_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3708_cast_fp16 = einsum(equation = var_3708_equation_0, values = (var_3530_cast_fp16, var_3686_cast_fp16))[name = tensor("op_3708_cast_fp16")]; tensor var_3710_equation_0 = const()[name = tensor("op_3710_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3710_cast_fp16 = einsum(equation = var_3710_equation_0, values = (var_3534_cast_fp16, var_3687_cast_fp16))[name = tensor("op_3710_cast_fp16")]; tensor var_3712_equation_0 = const()[name = tensor("op_3712_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3712_cast_fp16 = einsum(equation = var_3712_equation_0, values = (var_3538_cast_fp16, var_3688_cast_fp16))[name = tensor("op_3712_cast_fp16")]; tensor var_3714_equation_0 = const()[name = tensor("op_3714_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3714_cast_fp16 = einsum(equation = var_3714_equation_0, values = (var_3542_cast_fp16, var_3689_cast_fp16))[name = tensor("op_3714_cast_fp16")]; tensor var_3716_equation_0 = const()[name = tensor("op_3716_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3716_cast_fp16 = einsum(equation = var_3716_equation_0, values = (var_3546_cast_fp16, var_3690_cast_fp16))[name = tensor("op_3716_cast_fp16")]; tensor var_3718_equation_0 = const()[name = tensor("op_3718_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3718_cast_fp16 = einsum(equation = var_3718_equation_0, values = (var_3550_cast_fp16, var_3691_cast_fp16))[name = tensor("op_3718_cast_fp16")]; tensor var_3720_equation_0 = const()[name = tensor("op_3720_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3720_cast_fp16 = einsum(equation = var_3720_equation_0, values = (var_3554_cast_fp16, var_3692_cast_fp16))[name = tensor("op_3720_cast_fp16")]; tensor var_3722_equation_0 = const()[name = tensor("op_3722_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3722_cast_fp16 = einsum(equation = var_3722_equation_0, values = (var_3558_cast_fp16, var_3693_cast_fp16))[name = tensor("op_3722_cast_fp16")]; tensor var_3724_equation_0 = const()[name = tensor("op_3724_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3724_cast_fp16 = einsum(equation = var_3724_equation_0, values = (var_3562_cast_fp16, var_3694_cast_fp16))[name = tensor("op_3724_cast_fp16")]; tensor var_3726_equation_0 = const()[name = tensor("op_3726_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3726_cast_fp16 = einsum(equation = var_3726_equation_0, values = (var_3566_cast_fp16, var_3695_cast_fp16))[name = tensor("op_3726_cast_fp16")]; tensor var_3728_equation_0 = const()[name = tensor("op_3728_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3728_cast_fp16 = einsum(equation = var_3728_equation_0, values = (var_3570_cast_fp16, var_3696_cast_fp16))[name = tensor("op_3728_cast_fp16")]; tensor var_3730_equation_0 = const()[name = tensor("op_3730_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3730_cast_fp16 = einsum(equation = var_3730_equation_0, values = (var_3574_cast_fp16, var_3697_cast_fp16))[name = tensor("op_3730_cast_fp16")]; tensor var_3732_equation_0 = const()[name = tensor("op_3732_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3732_cast_fp16 = einsum(equation = var_3732_equation_0, values = (var_3578_cast_fp16, var_3698_cast_fp16))[name = tensor("op_3732_cast_fp16")]; tensor var_3734_equation_0 = const()[name = tensor("op_3734_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3734_cast_fp16 = einsum(equation = var_3734_equation_0, values = (var_3582_cast_fp16, var_3699_cast_fp16))[name = tensor("op_3734_cast_fp16")]; tensor var_3736_equation_0 = const()[name = tensor("op_3736_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3736_cast_fp16 = einsum(equation = var_3736_equation_0, values = (var_3586_cast_fp16, var_3700_cast_fp16))[name = tensor("op_3736_cast_fp16")]; tensor var_3738_equation_0 = const()[name = tensor("op_3738_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3738_cast_fp16 = einsum(equation = var_3738_equation_0, values = (var_3590_cast_fp16, var_3701_cast_fp16))[name = tensor("op_3738_cast_fp16")]; tensor var_3740_equation_0 = const()[name = tensor("op_3740_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3740_cast_fp16 = einsum(equation = var_3740_equation_0, values = (var_3594_cast_fp16, var_3702_cast_fp16))[name = tensor("op_3740_cast_fp16")]; tensor var_3742_equation_0 = const()[name = tensor("op_3742_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3742_cast_fp16 = einsum(equation = var_3742_equation_0, values = (var_3598_cast_fp16, var_3703_cast_fp16))[name = tensor("op_3742_cast_fp16")]; tensor var_3744_equation_0 = const()[name = tensor("op_3744_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_3744_cast_fp16 = einsum(equation = var_3744_equation_0, values = (var_3602_cast_fp16, var_3704_cast_fp16))[name = tensor("op_3744_cast_fp16")]; tensor input_159_interleave_0 = const()[name = tensor("input_159_interleave_0"), val = tensor(false)]; tensor input_159_cast_fp16 = concat(axis = var_2254, interleave = input_159_interleave_0, values = (var_3706_cast_fp16, var_3708_cast_fp16, var_3710_cast_fp16, var_3712_cast_fp16, var_3714_cast_fp16, var_3716_cast_fp16, var_3718_cast_fp16, var_3720_cast_fp16, var_3722_cast_fp16, var_3724_cast_fp16, var_3726_cast_fp16, var_3728_cast_fp16, var_3730_cast_fp16, var_3732_cast_fp16, var_3734_cast_fp16, var_3736_cast_fp16, var_3738_cast_fp16, var_3740_cast_fp16, var_3742_cast_fp16, var_3744_cast_fp16))[name = tensor("input_159_cast_fp16")]; tensor var_3750 = const()[name = tensor("op_3750"), val = tensor([1, 1])]; tensor var_3752 = const()[name = tensor("op_3752"), val = tensor([1, 1])]; tensor var_3754_pad_type_0 = const()[name = tensor("op_3754_pad_type_0"), val = tensor("custom")]; tensor var_3754_pad_0 = const()[name = tensor("op_3754_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(296200064)))]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299476928)))]; tensor var_3754_cast_fp16 = conv(bias = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_3752, groups = var_2254, pad = var_3754_pad_0, pad_type = var_3754_pad_type_0, strides = var_3750, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_159_cast_fp16)[name = tensor("op_3754_cast_fp16")]; tensor inputs_33_cast_fp16 = add(x = var_3754_cast_fp16, y = inputs_31_cast_fp16)[name = tensor("inputs_33_cast_fp16")]; tensor var_3758 = const()[name = tensor("op_3758"), val = tensor([1])]; tensor channels_mean_33_cast_fp16 = reduce_mean(axes = var_3758, keep_dims = var_2249, x = inputs_33_cast_fp16)[name = tensor("channels_mean_33_cast_fp16")]; tensor zero_mean_33_cast_fp16 = sub(x = inputs_33_cast_fp16, y = channels_mean_33_cast_fp16)[name = tensor("zero_mean_33_cast_fp16")]; tensor zero_mean_sq_33_cast_fp16 = mul(x = zero_mean_33_cast_fp16, y = zero_mean_33_cast_fp16)[name = tensor("zero_mean_sq_33_cast_fp16")]; tensor var_3762 = const()[name = tensor("op_3762"), val = tensor([1])]; tensor var_3763_cast_fp16 = reduce_mean(axes = var_3762, keep_dims = var_2249, x = zero_mean_sq_33_cast_fp16)[name = tensor("op_3763_cast_fp16")]; tensor var_3764_to_fp16 = const()[name = tensor("op_3764_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_3765_cast_fp16 = add(x = var_3763_cast_fp16, y = var_3764_to_fp16)[name = tensor("op_3765_cast_fp16")]; tensor denom_33_epsilon_0_to_fp16 = const()[name = tensor("denom_33_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_33_cast_fp16 = rsqrt(epsilon = denom_33_epsilon_0_to_fp16, x = var_3765_cast_fp16)[name = tensor("denom_33_cast_fp16")]; tensor out_33_cast_fp16 = mul(x = zero_mean_33_cast_fp16, y = denom_33_cast_fp16)[name = tensor("out_33_cast_fp16")]; tensor var_3769_to_fp16 = const()[name = tensor("op_3769_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299479552)))]; tensor var_3770_cast_fp16 = add(x = out_33_cast_fp16, y = var_3769_to_fp16)[name = tensor("op_3770_cast_fp16")]; tensor var_3772_to_fp16 = const()[name = tensor("op_3772_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299482176)))]; tensor hidden_states_101_cast_fp16 = mul(x = var_3770_cast_fp16, y = var_3772_to_fp16)[name = tensor("hidden_states_101_cast_fp16")]; tensor var_3779 = const()[name = tensor("op_3779"), val = tensor([1, 1])]; tensor var_3781 = const()[name = tensor("op_3781"), val = tensor([1, 1])]; tensor q_23_pad_type_0 = const()[name = tensor("q_23_pad_type_0"), val = tensor("custom")]; tensor q_23_pad_0 = const()[name = tensor("q_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(299484800)))]; tensor q_23_cast_fp16 = conv(dilations = var_3781, groups = var_2254, pad = q_23_pad_0, pad_type = q_23_pad_type_0, strides = var_3779, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_101_cast_fp16)[name = tensor("q_23_cast_fp16")]; tensor var_3785 = const()[name = tensor("op_3785"), val = tensor([1, 1])]; tensor var_3787 = const()[name = tensor("op_3787"), val = tensor([1, 1])]; tensor k_45_pad_type_0 = const()[name = tensor("k_45_pad_type_0"), val = tensor("custom")]; tensor k_45_pad_0 = const()[name = tensor("k_45_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302761664)))]; tensor k_45_cast_fp16 = conv(dilations = var_3787, groups = var_2254, pad = k_45_pad_0, pad_type = k_45_pad_type_0, strides = var_3785, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_45_cast_fp16")]; tensor var_3791 = const()[name = tensor("op_3791"), val = tensor([1, 1])]; tensor var_3793 = const()[name = tensor("op_3793"), val = tensor([1, 1])]; tensor v_23_pad_type_0 = const()[name = tensor("v_23_pad_type_0"), val = tensor("custom")]; tensor v_23_pad_0 = const()[name = tensor("v_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(305383168)))]; tensor v_23_cast_fp16 = conv(dilations = var_3793, groups = var_2254, pad = v_23_pad_0, pad_type = v_23_pad_type_0, strides = var_3791, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_23_cast_fp16")]; tensor var_3797_begin_0 = const()[name = tensor("op_3797_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_3797_end_0 = const()[name = tensor("op_3797_end_0"), val = tensor([2, 64, 1, 144])]; tensor var_3797_end_mask_0 = const()[name = tensor("op_3797_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3797_cast_fp16 = slice_by_index(begin = var_3797_begin_0, end = var_3797_end_0, end_mask = var_3797_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3797_cast_fp16")]; tensor var_3801_begin_0 = const()[name = tensor("op_3801_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_3801_end_0 = const()[name = tensor("op_3801_end_0"), val = tensor([2, 128, 1, 144])]; tensor var_3801_end_mask_0 = const()[name = tensor("op_3801_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3801_cast_fp16 = slice_by_index(begin = var_3801_begin_0, end = var_3801_end_0, end_mask = var_3801_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3801_cast_fp16")]; tensor var_3805_begin_0 = const()[name = tensor("op_3805_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_3805_end_0 = const()[name = tensor("op_3805_end_0"), val = tensor([2, 192, 1, 144])]; tensor var_3805_end_mask_0 = const()[name = tensor("op_3805_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3805_cast_fp16 = slice_by_index(begin = var_3805_begin_0, end = var_3805_end_0, end_mask = var_3805_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3805_cast_fp16")]; tensor var_3809_begin_0 = const()[name = tensor("op_3809_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_3809_end_0 = const()[name = tensor("op_3809_end_0"), val = tensor([2, 256, 1, 144])]; tensor var_3809_end_mask_0 = const()[name = tensor("op_3809_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3809_cast_fp16 = slice_by_index(begin = var_3809_begin_0, end = var_3809_end_0, end_mask = var_3809_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3809_cast_fp16")]; tensor var_3813_begin_0 = const()[name = tensor("op_3813_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_3813_end_0 = const()[name = tensor("op_3813_end_0"), val = tensor([2, 320, 1, 144])]; tensor var_3813_end_mask_0 = const()[name = tensor("op_3813_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3813_cast_fp16 = slice_by_index(begin = var_3813_begin_0, end = var_3813_end_0, end_mask = var_3813_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3813_cast_fp16")]; tensor var_3817_begin_0 = const()[name = tensor("op_3817_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_3817_end_0 = const()[name = tensor("op_3817_end_0"), val = tensor([2, 384, 1, 144])]; tensor var_3817_end_mask_0 = const()[name = tensor("op_3817_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3817_cast_fp16 = slice_by_index(begin = var_3817_begin_0, end = var_3817_end_0, end_mask = var_3817_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3817_cast_fp16")]; tensor var_3821_begin_0 = const()[name = tensor("op_3821_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_3821_end_0 = const()[name = tensor("op_3821_end_0"), val = tensor([2, 448, 1, 144])]; tensor var_3821_end_mask_0 = const()[name = tensor("op_3821_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3821_cast_fp16 = slice_by_index(begin = var_3821_begin_0, end = var_3821_end_0, end_mask = var_3821_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3821_cast_fp16")]; tensor var_3825_begin_0 = const()[name = tensor("op_3825_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_3825_end_0 = const()[name = tensor("op_3825_end_0"), val = tensor([2, 512, 1, 144])]; tensor var_3825_end_mask_0 = const()[name = tensor("op_3825_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3825_cast_fp16 = slice_by_index(begin = var_3825_begin_0, end = var_3825_end_0, end_mask = var_3825_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3825_cast_fp16")]; tensor var_3829_begin_0 = const()[name = tensor("op_3829_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_3829_end_0 = const()[name = tensor("op_3829_end_0"), val = tensor([2, 576, 1, 144])]; tensor var_3829_end_mask_0 = const()[name = tensor("op_3829_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3829_cast_fp16 = slice_by_index(begin = var_3829_begin_0, end = var_3829_end_0, end_mask = var_3829_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3829_cast_fp16")]; tensor var_3833_begin_0 = const()[name = tensor("op_3833_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_3833_end_0 = const()[name = tensor("op_3833_end_0"), val = tensor([2, 640, 1, 144])]; tensor var_3833_end_mask_0 = const()[name = tensor("op_3833_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3833_cast_fp16 = slice_by_index(begin = var_3833_begin_0, end = var_3833_end_0, end_mask = var_3833_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3833_cast_fp16")]; tensor var_3837_begin_0 = const()[name = tensor("op_3837_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_3837_end_0 = const()[name = tensor("op_3837_end_0"), val = tensor([2, 704, 1, 144])]; tensor var_3837_end_mask_0 = const()[name = tensor("op_3837_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3837_cast_fp16 = slice_by_index(begin = var_3837_begin_0, end = var_3837_end_0, end_mask = var_3837_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3837_cast_fp16")]; tensor var_3841_begin_0 = const()[name = tensor("op_3841_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_3841_end_0 = const()[name = tensor("op_3841_end_0"), val = tensor([2, 768, 1, 144])]; tensor var_3841_end_mask_0 = const()[name = tensor("op_3841_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3841_cast_fp16 = slice_by_index(begin = var_3841_begin_0, end = var_3841_end_0, end_mask = var_3841_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3841_cast_fp16")]; tensor var_3845_begin_0 = const()[name = tensor("op_3845_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_3845_end_0 = const()[name = tensor("op_3845_end_0"), val = tensor([2, 832, 1, 144])]; tensor var_3845_end_mask_0 = const()[name = tensor("op_3845_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3845_cast_fp16 = slice_by_index(begin = var_3845_begin_0, end = var_3845_end_0, end_mask = var_3845_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3845_cast_fp16")]; tensor var_3849_begin_0 = const()[name = tensor("op_3849_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_3849_end_0 = const()[name = tensor("op_3849_end_0"), val = tensor([2, 896, 1, 144])]; tensor var_3849_end_mask_0 = const()[name = tensor("op_3849_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3849_cast_fp16 = slice_by_index(begin = var_3849_begin_0, end = var_3849_end_0, end_mask = var_3849_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3849_cast_fp16")]; tensor var_3853_begin_0 = const()[name = tensor("op_3853_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_3853_end_0 = const()[name = tensor("op_3853_end_0"), val = tensor([2, 960, 1, 144])]; tensor var_3853_end_mask_0 = const()[name = tensor("op_3853_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3853_cast_fp16 = slice_by_index(begin = var_3853_begin_0, end = var_3853_end_0, end_mask = var_3853_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3853_cast_fp16")]; tensor var_3857_begin_0 = const()[name = tensor("op_3857_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_3857_end_0 = const()[name = tensor("op_3857_end_0"), val = tensor([2, 1024, 1, 144])]; tensor var_3857_end_mask_0 = const()[name = tensor("op_3857_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3857_cast_fp16 = slice_by_index(begin = var_3857_begin_0, end = var_3857_end_0, end_mask = var_3857_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3857_cast_fp16")]; tensor var_3861_begin_0 = const()[name = tensor("op_3861_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_3861_end_0 = const()[name = tensor("op_3861_end_0"), val = tensor([2, 1088, 1, 144])]; tensor var_3861_end_mask_0 = const()[name = tensor("op_3861_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3861_cast_fp16 = slice_by_index(begin = var_3861_begin_0, end = var_3861_end_0, end_mask = var_3861_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3861_cast_fp16")]; tensor var_3865_begin_0 = const()[name = tensor("op_3865_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_3865_end_0 = const()[name = tensor("op_3865_end_0"), val = tensor([2, 1152, 1, 144])]; tensor var_3865_end_mask_0 = const()[name = tensor("op_3865_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3865_cast_fp16 = slice_by_index(begin = var_3865_begin_0, end = var_3865_end_0, end_mask = var_3865_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3865_cast_fp16")]; tensor var_3869_begin_0 = const()[name = tensor("op_3869_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_3869_end_0 = const()[name = tensor("op_3869_end_0"), val = tensor([2, 1216, 1, 144])]; tensor var_3869_end_mask_0 = const()[name = tensor("op_3869_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3869_cast_fp16 = slice_by_index(begin = var_3869_begin_0, end = var_3869_end_0, end_mask = var_3869_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3869_cast_fp16")]; tensor var_3873_begin_0 = const()[name = tensor("op_3873_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_3873_end_0 = const()[name = tensor("op_3873_end_0"), val = tensor([2, 1280, 1, 144])]; tensor var_3873_end_mask_0 = const()[name = tensor("op_3873_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3873_cast_fp16 = slice_by_index(begin = var_3873_begin_0, end = var_3873_end_0, end_mask = var_3873_end_mask_0, x = q_23_cast_fp16)[name = tensor("op_3873_cast_fp16")]; tensor k_47_perm_0 = const()[name = tensor("k_47_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_3880_begin_0 = const()[name = tensor("op_3880_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_3880_end_0 = const()[name = tensor("op_3880_end_0"), val = tensor([2, 77, 1, 64])]; tensor var_3880_end_mask_0 = const()[name = tensor("op_3880_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_2 = transpose(perm = k_47_perm_0, x = k_45_cast_fp16)[name = tensor("transpose_2")]; tensor var_3880_cast_fp16 = slice_by_index(begin = var_3880_begin_0, end = var_3880_end_0, end_mask = var_3880_end_mask_0, x = transpose_2)[name = tensor("op_3880_cast_fp16")]; tensor var_3884_begin_0 = const()[name = tensor("op_3884_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_3884_end_0 = const()[name = tensor("op_3884_end_0"), val = tensor([2, 77, 1, 128])]; tensor var_3884_end_mask_0 = const()[name = tensor("op_3884_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3884_cast_fp16 = slice_by_index(begin = var_3884_begin_0, end = var_3884_end_0, end_mask = var_3884_end_mask_0, x = transpose_2)[name = tensor("op_3884_cast_fp16")]; tensor var_3888_begin_0 = const()[name = tensor("op_3888_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_3888_end_0 = const()[name = tensor("op_3888_end_0"), val = tensor([2, 77, 1, 192])]; tensor var_3888_end_mask_0 = const()[name = tensor("op_3888_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3888_cast_fp16 = slice_by_index(begin = var_3888_begin_0, end = var_3888_end_0, end_mask = var_3888_end_mask_0, x = transpose_2)[name = tensor("op_3888_cast_fp16")]; tensor var_3892_begin_0 = const()[name = tensor("op_3892_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_3892_end_0 = const()[name = tensor("op_3892_end_0"), val = tensor([2, 77, 1, 256])]; tensor var_3892_end_mask_0 = const()[name = tensor("op_3892_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3892_cast_fp16 = slice_by_index(begin = var_3892_begin_0, end = var_3892_end_0, end_mask = var_3892_end_mask_0, x = transpose_2)[name = tensor("op_3892_cast_fp16")]; tensor var_3896_begin_0 = const()[name = tensor("op_3896_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_3896_end_0 = const()[name = tensor("op_3896_end_0"), val = tensor([2, 77, 1, 320])]; tensor var_3896_end_mask_0 = const()[name = tensor("op_3896_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3896_cast_fp16 = slice_by_index(begin = var_3896_begin_0, end = var_3896_end_0, end_mask = var_3896_end_mask_0, x = transpose_2)[name = tensor("op_3896_cast_fp16")]; tensor var_3900_begin_0 = const()[name = tensor("op_3900_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_3900_end_0 = const()[name = tensor("op_3900_end_0"), val = tensor([2, 77, 1, 384])]; tensor var_3900_end_mask_0 = const()[name = tensor("op_3900_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3900_cast_fp16 = slice_by_index(begin = var_3900_begin_0, end = var_3900_end_0, end_mask = var_3900_end_mask_0, x = transpose_2)[name = tensor("op_3900_cast_fp16")]; tensor var_3904_begin_0 = const()[name = tensor("op_3904_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_3904_end_0 = const()[name = tensor("op_3904_end_0"), val = tensor([2, 77, 1, 448])]; tensor var_3904_end_mask_0 = const()[name = tensor("op_3904_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3904_cast_fp16 = slice_by_index(begin = var_3904_begin_0, end = var_3904_end_0, end_mask = var_3904_end_mask_0, x = transpose_2)[name = tensor("op_3904_cast_fp16")]; tensor var_3908_begin_0 = const()[name = tensor("op_3908_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_3908_end_0 = const()[name = tensor("op_3908_end_0"), val = tensor([2, 77, 1, 512])]; tensor var_3908_end_mask_0 = const()[name = tensor("op_3908_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3908_cast_fp16 = slice_by_index(begin = var_3908_begin_0, end = var_3908_end_0, end_mask = var_3908_end_mask_0, x = transpose_2)[name = tensor("op_3908_cast_fp16")]; tensor var_3912_begin_0 = const()[name = tensor("op_3912_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_3912_end_0 = const()[name = tensor("op_3912_end_0"), val = tensor([2, 77, 1, 576])]; tensor var_3912_end_mask_0 = const()[name = tensor("op_3912_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3912_cast_fp16 = slice_by_index(begin = var_3912_begin_0, end = var_3912_end_0, end_mask = var_3912_end_mask_0, x = transpose_2)[name = tensor("op_3912_cast_fp16")]; tensor var_3916_begin_0 = const()[name = tensor("op_3916_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_3916_end_0 = const()[name = tensor("op_3916_end_0"), val = tensor([2, 77, 1, 640])]; tensor var_3916_end_mask_0 = const()[name = tensor("op_3916_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3916_cast_fp16 = slice_by_index(begin = var_3916_begin_0, end = var_3916_end_0, end_mask = var_3916_end_mask_0, x = transpose_2)[name = tensor("op_3916_cast_fp16")]; tensor var_3920_begin_0 = const()[name = tensor("op_3920_begin_0"), val = tensor([0, 0, 0, 640])]; tensor var_3920_end_0 = const()[name = tensor("op_3920_end_0"), val = tensor([2, 77, 1, 704])]; tensor var_3920_end_mask_0 = const()[name = tensor("op_3920_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3920_cast_fp16 = slice_by_index(begin = var_3920_begin_0, end = var_3920_end_0, end_mask = var_3920_end_mask_0, x = transpose_2)[name = tensor("op_3920_cast_fp16")]; tensor var_3924_begin_0 = const()[name = tensor("op_3924_begin_0"), val = tensor([0, 0, 0, 704])]; tensor var_3924_end_0 = const()[name = tensor("op_3924_end_0"), val = tensor([2, 77, 1, 768])]; tensor var_3924_end_mask_0 = const()[name = tensor("op_3924_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3924_cast_fp16 = slice_by_index(begin = var_3924_begin_0, end = var_3924_end_0, end_mask = var_3924_end_mask_0, x = transpose_2)[name = tensor("op_3924_cast_fp16")]; tensor var_3928_begin_0 = const()[name = tensor("op_3928_begin_0"), val = tensor([0, 0, 0, 768])]; tensor var_3928_end_0 = const()[name = tensor("op_3928_end_0"), val = tensor([2, 77, 1, 832])]; tensor var_3928_end_mask_0 = const()[name = tensor("op_3928_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3928_cast_fp16 = slice_by_index(begin = var_3928_begin_0, end = var_3928_end_0, end_mask = var_3928_end_mask_0, x = transpose_2)[name = tensor("op_3928_cast_fp16")]; tensor var_3932_begin_0 = const()[name = tensor("op_3932_begin_0"), val = tensor([0, 0, 0, 832])]; tensor var_3932_end_0 = const()[name = tensor("op_3932_end_0"), val = tensor([2, 77, 1, 896])]; tensor var_3932_end_mask_0 = const()[name = tensor("op_3932_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3932_cast_fp16 = slice_by_index(begin = var_3932_begin_0, end = var_3932_end_0, end_mask = var_3932_end_mask_0, x = transpose_2)[name = tensor("op_3932_cast_fp16")]; tensor var_3936_begin_0 = const()[name = tensor("op_3936_begin_0"), val = tensor([0, 0, 0, 896])]; tensor var_3936_end_0 = const()[name = tensor("op_3936_end_0"), val = tensor([2, 77, 1, 960])]; tensor var_3936_end_mask_0 = const()[name = tensor("op_3936_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3936_cast_fp16 = slice_by_index(begin = var_3936_begin_0, end = var_3936_end_0, end_mask = var_3936_end_mask_0, x = transpose_2)[name = tensor("op_3936_cast_fp16")]; tensor var_3940_begin_0 = const()[name = tensor("op_3940_begin_0"), val = tensor([0, 0, 0, 960])]; tensor var_3940_end_0 = const()[name = tensor("op_3940_end_0"), val = tensor([2, 77, 1, 1024])]; tensor var_3940_end_mask_0 = const()[name = tensor("op_3940_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3940_cast_fp16 = slice_by_index(begin = var_3940_begin_0, end = var_3940_end_0, end_mask = var_3940_end_mask_0, x = transpose_2)[name = tensor("op_3940_cast_fp16")]; tensor var_3944_begin_0 = const()[name = tensor("op_3944_begin_0"), val = tensor([0, 0, 0, 1024])]; tensor var_3944_end_0 = const()[name = tensor("op_3944_end_0"), val = tensor([2, 77, 1, 1088])]; tensor var_3944_end_mask_0 = const()[name = tensor("op_3944_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3944_cast_fp16 = slice_by_index(begin = var_3944_begin_0, end = var_3944_end_0, end_mask = var_3944_end_mask_0, x = transpose_2)[name = tensor("op_3944_cast_fp16")]; tensor var_3948_begin_0 = const()[name = tensor("op_3948_begin_0"), val = tensor([0, 0, 0, 1088])]; tensor var_3948_end_0 = const()[name = tensor("op_3948_end_0"), val = tensor([2, 77, 1, 1152])]; tensor var_3948_end_mask_0 = const()[name = tensor("op_3948_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3948_cast_fp16 = slice_by_index(begin = var_3948_begin_0, end = var_3948_end_0, end_mask = var_3948_end_mask_0, x = transpose_2)[name = tensor("op_3948_cast_fp16")]; tensor var_3952_begin_0 = const()[name = tensor("op_3952_begin_0"), val = tensor([0, 0, 0, 1152])]; tensor var_3952_end_0 = const()[name = tensor("op_3952_end_0"), val = tensor([2, 77, 1, 1216])]; tensor var_3952_end_mask_0 = const()[name = tensor("op_3952_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3952_cast_fp16 = slice_by_index(begin = var_3952_begin_0, end = var_3952_end_0, end_mask = var_3952_end_mask_0, x = transpose_2)[name = tensor("op_3952_cast_fp16")]; tensor var_3956_begin_0 = const()[name = tensor("op_3956_begin_0"), val = tensor([0, 0, 0, 1216])]; tensor var_3956_end_0 = const()[name = tensor("op_3956_end_0"), val = tensor([2, 77, 1, 1280])]; tensor var_3956_end_mask_0 = const()[name = tensor("op_3956_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_3956_cast_fp16 = slice_by_index(begin = var_3956_begin_0, end = var_3956_end_0, end_mask = var_3956_end_mask_0, x = transpose_2)[name = tensor("op_3956_cast_fp16")]; tensor var_3958_begin_0 = const()[name = tensor("op_3958_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_3958_end_0 = const()[name = tensor("op_3958_end_0"), val = tensor([2, 64, 1, 77])]; tensor var_3958_end_mask_0 = const()[name = tensor("op_3958_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3958_cast_fp16 = slice_by_index(begin = var_3958_begin_0, end = var_3958_end_0, end_mask = var_3958_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3958_cast_fp16")]; tensor var_3962_begin_0 = const()[name = tensor("op_3962_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_3962_end_0 = const()[name = tensor("op_3962_end_0"), val = tensor([2, 128, 1, 77])]; tensor var_3962_end_mask_0 = const()[name = tensor("op_3962_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3962_cast_fp16 = slice_by_index(begin = var_3962_begin_0, end = var_3962_end_0, end_mask = var_3962_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3962_cast_fp16")]; tensor var_3966_begin_0 = const()[name = tensor("op_3966_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_3966_end_0 = const()[name = tensor("op_3966_end_0"), val = tensor([2, 192, 1, 77])]; tensor var_3966_end_mask_0 = const()[name = tensor("op_3966_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3966_cast_fp16 = slice_by_index(begin = var_3966_begin_0, end = var_3966_end_0, end_mask = var_3966_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3966_cast_fp16")]; tensor var_3970_begin_0 = const()[name = tensor("op_3970_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_3970_end_0 = const()[name = tensor("op_3970_end_0"), val = tensor([2, 256, 1, 77])]; tensor var_3970_end_mask_0 = const()[name = tensor("op_3970_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3970_cast_fp16 = slice_by_index(begin = var_3970_begin_0, end = var_3970_end_0, end_mask = var_3970_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3970_cast_fp16")]; tensor var_3974_begin_0 = const()[name = tensor("op_3974_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_3974_end_0 = const()[name = tensor("op_3974_end_0"), val = tensor([2, 320, 1, 77])]; tensor var_3974_end_mask_0 = const()[name = tensor("op_3974_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3974_cast_fp16 = slice_by_index(begin = var_3974_begin_0, end = var_3974_end_0, end_mask = var_3974_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3974_cast_fp16")]; tensor var_3978_begin_0 = const()[name = tensor("op_3978_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_3978_end_0 = const()[name = tensor("op_3978_end_0"), val = tensor([2, 384, 1, 77])]; tensor var_3978_end_mask_0 = const()[name = tensor("op_3978_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3978_cast_fp16 = slice_by_index(begin = var_3978_begin_0, end = var_3978_end_0, end_mask = var_3978_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3978_cast_fp16")]; tensor var_3982_begin_0 = const()[name = tensor("op_3982_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_3982_end_0 = const()[name = tensor("op_3982_end_0"), val = tensor([2, 448, 1, 77])]; tensor var_3982_end_mask_0 = const()[name = tensor("op_3982_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3982_cast_fp16 = slice_by_index(begin = var_3982_begin_0, end = var_3982_end_0, end_mask = var_3982_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3982_cast_fp16")]; tensor var_3986_begin_0 = const()[name = tensor("op_3986_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_3986_end_0 = const()[name = tensor("op_3986_end_0"), val = tensor([2, 512, 1, 77])]; tensor var_3986_end_mask_0 = const()[name = tensor("op_3986_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3986_cast_fp16 = slice_by_index(begin = var_3986_begin_0, end = var_3986_end_0, end_mask = var_3986_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3986_cast_fp16")]; tensor var_3990_begin_0 = const()[name = tensor("op_3990_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_3990_end_0 = const()[name = tensor("op_3990_end_0"), val = tensor([2, 576, 1, 77])]; tensor var_3990_end_mask_0 = const()[name = tensor("op_3990_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3990_cast_fp16 = slice_by_index(begin = var_3990_begin_0, end = var_3990_end_0, end_mask = var_3990_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3990_cast_fp16")]; tensor var_3994_begin_0 = const()[name = tensor("op_3994_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_3994_end_0 = const()[name = tensor("op_3994_end_0"), val = tensor([2, 640, 1, 77])]; tensor var_3994_end_mask_0 = const()[name = tensor("op_3994_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3994_cast_fp16 = slice_by_index(begin = var_3994_begin_0, end = var_3994_end_0, end_mask = var_3994_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3994_cast_fp16")]; tensor var_3998_begin_0 = const()[name = tensor("op_3998_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_3998_end_0 = const()[name = tensor("op_3998_end_0"), val = tensor([2, 704, 1, 77])]; tensor var_3998_end_mask_0 = const()[name = tensor("op_3998_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_3998_cast_fp16 = slice_by_index(begin = var_3998_begin_0, end = var_3998_end_0, end_mask = var_3998_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_3998_cast_fp16")]; tensor var_4002_begin_0 = const()[name = tensor("op_4002_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_4002_end_0 = const()[name = tensor("op_4002_end_0"), val = tensor([2, 768, 1, 77])]; tensor var_4002_end_mask_0 = const()[name = tensor("op_4002_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4002_cast_fp16 = slice_by_index(begin = var_4002_begin_0, end = var_4002_end_0, end_mask = var_4002_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4002_cast_fp16")]; tensor var_4006_begin_0 = const()[name = tensor("op_4006_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_4006_end_0 = const()[name = tensor("op_4006_end_0"), val = tensor([2, 832, 1, 77])]; tensor var_4006_end_mask_0 = const()[name = tensor("op_4006_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4006_cast_fp16 = slice_by_index(begin = var_4006_begin_0, end = var_4006_end_0, end_mask = var_4006_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4006_cast_fp16")]; tensor var_4010_begin_0 = const()[name = tensor("op_4010_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_4010_end_0 = const()[name = tensor("op_4010_end_0"), val = tensor([2, 896, 1, 77])]; tensor var_4010_end_mask_0 = const()[name = tensor("op_4010_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4010_cast_fp16 = slice_by_index(begin = var_4010_begin_0, end = var_4010_end_0, end_mask = var_4010_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4010_cast_fp16")]; tensor var_4014_begin_0 = const()[name = tensor("op_4014_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_4014_end_0 = const()[name = tensor("op_4014_end_0"), val = tensor([2, 960, 1, 77])]; tensor var_4014_end_mask_0 = const()[name = tensor("op_4014_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4014_cast_fp16 = slice_by_index(begin = var_4014_begin_0, end = var_4014_end_0, end_mask = var_4014_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4014_cast_fp16")]; tensor var_4018_begin_0 = const()[name = tensor("op_4018_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_4018_end_0 = const()[name = tensor("op_4018_end_0"), val = tensor([2, 1024, 1, 77])]; tensor var_4018_end_mask_0 = const()[name = tensor("op_4018_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4018_cast_fp16 = slice_by_index(begin = var_4018_begin_0, end = var_4018_end_0, end_mask = var_4018_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4018_cast_fp16")]; tensor var_4022_begin_0 = const()[name = tensor("op_4022_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_4022_end_0 = const()[name = tensor("op_4022_end_0"), val = tensor([2, 1088, 1, 77])]; tensor var_4022_end_mask_0 = const()[name = tensor("op_4022_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4022_cast_fp16 = slice_by_index(begin = var_4022_begin_0, end = var_4022_end_0, end_mask = var_4022_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4022_cast_fp16")]; tensor var_4026_begin_0 = const()[name = tensor("op_4026_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_4026_end_0 = const()[name = tensor("op_4026_end_0"), val = tensor([2, 1152, 1, 77])]; tensor var_4026_end_mask_0 = const()[name = tensor("op_4026_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4026_cast_fp16 = slice_by_index(begin = var_4026_begin_0, end = var_4026_end_0, end_mask = var_4026_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4026_cast_fp16")]; tensor var_4030_begin_0 = const()[name = tensor("op_4030_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_4030_end_0 = const()[name = tensor("op_4030_end_0"), val = tensor([2, 1216, 1, 77])]; tensor var_4030_end_mask_0 = const()[name = tensor("op_4030_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4030_cast_fp16 = slice_by_index(begin = var_4030_begin_0, end = var_4030_end_0, end_mask = var_4030_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4030_cast_fp16")]; tensor var_4034_begin_0 = const()[name = tensor("op_4034_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_4034_end_0 = const()[name = tensor("op_4034_end_0"), val = tensor([2, 1280, 1, 77])]; tensor var_4034_end_mask_0 = const()[name = tensor("op_4034_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4034_cast_fp16 = slice_by_index(begin = var_4034_begin_0, end = var_4034_end_0, end_mask = var_4034_end_mask_0, x = v_23_cast_fp16)[name = tensor("op_4034_cast_fp16")]; tensor var_4038_equation_0 = const()[name = tensor("op_4038_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4038_cast_fp16 = einsum(equation = var_4038_equation_0, values = (var_3880_cast_fp16, var_3797_cast_fp16))[name = tensor("op_4038_cast_fp16")]; tensor var_4039_to_fp16 = const()[name = tensor("op_4039_to_fp16"), val = tensor(0x1p-3)]; tensor aw_241_cast_fp16 = mul(x = var_4038_cast_fp16, y = var_4039_to_fp16)[name = tensor("aw_241_cast_fp16")]; tensor var_4042_equation_0 = const()[name = tensor("op_4042_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4042_cast_fp16 = einsum(equation = var_4042_equation_0, values = (var_3884_cast_fp16, var_3801_cast_fp16))[name = tensor("op_4042_cast_fp16")]; tensor var_4043_to_fp16 = const()[name = tensor("op_4043_to_fp16"), val = tensor(0x1p-3)]; tensor aw_243_cast_fp16 = mul(x = var_4042_cast_fp16, y = var_4043_to_fp16)[name = tensor("aw_243_cast_fp16")]; tensor var_4046_equation_0 = const()[name = tensor("op_4046_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4046_cast_fp16 = einsum(equation = var_4046_equation_0, values = (var_3888_cast_fp16, var_3805_cast_fp16))[name = tensor("op_4046_cast_fp16")]; tensor var_4047_to_fp16 = const()[name = tensor("op_4047_to_fp16"), val = tensor(0x1p-3)]; tensor aw_245_cast_fp16 = mul(x = var_4046_cast_fp16, y = var_4047_to_fp16)[name = tensor("aw_245_cast_fp16")]; tensor var_4050_equation_0 = const()[name = tensor("op_4050_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4050_cast_fp16 = einsum(equation = var_4050_equation_0, values = (var_3892_cast_fp16, var_3809_cast_fp16))[name = tensor("op_4050_cast_fp16")]; tensor var_4051_to_fp16 = const()[name = tensor("op_4051_to_fp16"), val = tensor(0x1p-3)]; tensor aw_247_cast_fp16 = mul(x = var_4050_cast_fp16, y = var_4051_to_fp16)[name = tensor("aw_247_cast_fp16")]; tensor var_4054_equation_0 = const()[name = tensor("op_4054_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4054_cast_fp16 = einsum(equation = var_4054_equation_0, values = (var_3896_cast_fp16, var_3813_cast_fp16))[name = tensor("op_4054_cast_fp16")]; tensor var_4055_to_fp16 = const()[name = tensor("op_4055_to_fp16"), val = tensor(0x1p-3)]; tensor aw_249_cast_fp16 = mul(x = var_4054_cast_fp16, y = var_4055_to_fp16)[name = tensor("aw_249_cast_fp16")]; tensor var_4058_equation_0 = const()[name = tensor("op_4058_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4058_cast_fp16 = einsum(equation = var_4058_equation_0, values = (var_3900_cast_fp16, var_3817_cast_fp16))[name = tensor("op_4058_cast_fp16")]; tensor var_4059_to_fp16 = const()[name = tensor("op_4059_to_fp16"), val = tensor(0x1p-3)]; tensor aw_251_cast_fp16 = mul(x = var_4058_cast_fp16, y = var_4059_to_fp16)[name = tensor("aw_251_cast_fp16")]; tensor var_4062_equation_0 = const()[name = tensor("op_4062_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4062_cast_fp16 = einsum(equation = var_4062_equation_0, values = (var_3904_cast_fp16, var_3821_cast_fp16))[name = tensor("op_4062_cast_fp16")]; tensor var_4063_to_fp16 = const()[name = tensor("op_4063_to_fp16"), val = tensor(0x1p-3)]; tensor aw_253_cast_fp16 = mul(x = var_4062_cast_fp16, y = var_4063_to_fp16)[name = tensor("aw_253_cast_fp16")]; tensor var_4066_equation_0 = const()[name = tensor("op_4066_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4066_cast_fp16 = einsum(equation = var_4066_equation_0, values = (var_3908_cast_fp16, var_3825_cast_fp16))[name = tensor("op_4066_cast_fp16")]; tensor var_4067_to_fp16 = const()[name = tensor("op_4067_to_fp16"), val = tensor(0x1p-3)]; tensor aw_255_cast_fp16 = mul(x = var_4066_cast_fp16, y = var_4067_to_fp16)[name = tensor("aw_255_cast_fp16")]; tensor var_4070_equation_0 = const()[name = tensor("op_4070_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4070_cast_fp16 = einsum(equation = var_4070_equation_0, values = (var_3912_cast_fp16, var_3829_cast_fp16))[name = tensor("op_4070_cast_fp16")]; tensor var_4071_to_fp16 = const()[name = tensor("op_4071_to_fp16"), val = tensor(0x1p-3)]; tensor aw_257_cast_fp16 = mul(x = var_4070_cast_fp16, y = var_4071_to_fp16)[name = tensor("aw_257_cast_fp16")]; tensor var_4074_equation_0 = const()[name = tensor("op_4074_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4074_cast_fp16 = einsum(equation = var_4074_equation_0, values = (var_3916_cast_fp16, var_3833_cast_fp16))[name = tensor("op_4074_cast_fp16")]; tensor var_4075_to_fp16 = const()[name = tensor("op_4075_to_fp16"), val = tensor(0x1p-3)]; tensor aw_259_cast_fp16 = mul(x = var_4074_cast_fp16, y = var_4075_to_fp16)[name = tensor("aw_259_cast_fp16")]; tensor var_4078_equation_0 = const()[name = tensor("op_4078_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4078_cast_fp16 = einsum(equation = var_4078_equation_0, values = (var_3920_cast_fp16, var_3837_cast_fp16))[name = tensor("op_4078_cast_fp16")]; tensor var_4079_to_fp16 = const()[name = tensor("op_4079_to_fp16"), val = tensor(0x1p-3)]; tensor aw_261_cast_fp16 = mul(x = var_4078_cast_fp16, y = var_4079_to_fp16)[name = tensor("aw_261_cast_fp16")]; tensor var_4082_equation_0 = const()[name = tensor("op_4082_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4082_cast_fp16 = einsum(equation = var_4082_equation_0, values = (var_3924_cast_fp16, var_3841_cast_fp16))[name = tensor("op_4082_cast_fp16")]; tensor var_4083_to_fp16 = const()[name = tensor("op_4083_to_fp16"), val = tensor(0x1p-3)]; tensor aw_263_cast_fp16 = mul(x = var_4082_cast_fp16, y = var_4083_to_fp16)[name = tensor("aw_263_cast_fp16")]; tensor var_4086_equation_0 = const()[name = tensor("op_4086_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4086_cast_fp16 = einsum(equation = var_4086_equation_0, values = (var_3928_cast_fp16, var_3845_cast_fp16))[name = tensor("op_4086_cast_fp16")]; tensor var_4087_to_fp16 = const()[name = tensor("op_4087_to_fp16"), val = tensor(0x1p-3)]; tensor aw_265_cast_fp16 = mul(x = var_4086_cast_fp16, y = var_4087_to_fp16)[name = tensor("aw_265_cast_fp16")]; tensor var_4090_equation_0 = const()[name = tensor("op_4090_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4090_cast_fp16 = einsum(equation = var_4090_equation_0, values = (var_3932_cast_fp16, var_3849_cast_fp16))[name = tensor("op_4090_cast_fp16")]; tensor var_4091_to_fp16 = const()[name = tensor("op_4091_to_fp16"), val = tensor(0x1p-3)]; tensor aw_267_cast_fp16 = mul(x = var_4090_cast_fp16, y = var_4091_to_fp16)[name = tensor("aw_267_cast_fp16")]; tensor var_4094_equation_0 = const()[name = tensor("op_4094_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4094_cast_fp16 = einsum(equation = var_4094_equation_0, values = (var_3936_cast_fp16, var_3853_cast_fp16))[name = tensor("op_4094_cast_fp16")]; tensor var_4095_to_fp16 = const()[name = tensor("op_4095_to_fp16"), val = tensor(0x1p-3)]; tensor aw_269_cast_fp16 = mul(x = var_4094_cast_fp16, y = var_4095_to_fp16)[name = tensor("aw_269_cast_fp16")]; tensor var_4098_equation_0 = const()[name = tensor("op_4098_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4098_cast_fp16 = einsum(equation = var_4098_equation_0, values = (var_3940_cast_fp16, var_3857_cast_fp16))[name = tensor("op_4098_cast_fp16")]; tensor var_4099_to_fp16 = const()[name = tensor("op_4099_to_fp16"), val = tensor(0x1p-3)]; tensor aw_271_cast_fp16 = mul(x = var_4098_cast_fp16, y = var_4099_to_fp16)[name = tensor("aw_271_cast_fp16")]; tensor var_4102_equation_0 = const()[name = tensor("op_4102_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4102_cast_fp16 = einsum(equation = var_4102_equation_0, values = (var_3944_cast_fp16, var_3861_cast_fp16))[name = tensor("op_4102_cast_fp16")]; tensor var_4103_to_fp16 = const()[name = tensor("op_4103_to_fp16"), val = tensor(0x1p-3)]; tensor aw_273_cast_fp16 = mul(x = var_4102_cast_fp16, y = var_4103_to_fp16)[name = tensor("aw_273_cast_fp16")]; tensor var_4106_equation_0 = const()[name = tensor("op_4106_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4106_cast_fp16 = einsum(equation = var_4106_equation_0, values = (var_3948_cast_fp16, var_3865_cast_fp16))[name = tensor("op_4106_cast_fp16")]; tensor var_4107_to_fp16 = const()[name = tensor("op_4107_to_fp16"), val = tensor(0x1p-3)]; tensor aw_275_cast_fp16 = mul(x = var_4106_cast_fp16, y = var_4107_to_fp16)[name = tensor("aw_275_cast_fp16")]; tensor var_4110_equation_0 = const()[name = tensor("op_4110_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4110_cast_fp16 = einsum(equation = var_4110_equation_0, values = (var_3952_cast_fp16, var_3869_cast_fp16))[name = tensor("op_4110_cast_fp16")]; tensor var_4111_to_fp16 = const()[name = tensor("op_4111_to_fp16"), val = tensor(0x1p-3)]; tensor aw_277_cast_fp16 = mul(x = var_4110_cast_fp16, y = var_4111_to_fp16)[name = tensor("aw_277_cast_fp16")]; tensor var_4114_equation_0 = const()[name = tensor("op_4114_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4114_cast_fp16 = einsum(equation = var_4114_equation_0, values = (var_3956_cast_fp16, var_3873_cast_fp16))[name = tensor("op_4114_cast_fp16")]; tensor var_4115_to_fp16 = const()[name = tensor("op_4115_to_fp16"), val = tensor(0x1p-3)]; tensor aw_279_cast_fp16 = mul(x = var_4114_cast_fp16, y = var_4115_to_fp16)[name = tensor("aw_279_cast_fp16")]; tensor var_4117_cast_fp16 = softmax(axis = var_2254, x = aw_241_cast_fp16)[name = tensor("op_4117_cast_fp16")]; tensor var_4118_cast_fp16 = softmax(axis = var_2254, x = aw_243_cast_fp16)[name = tensor("op_4118_cast_fp16")]; tensor var_4119_cast_fp16 = softmax(axis = var_2254, x = aw_245_cast_fp16)[name = tensor("op_4119_cast_fp16")]; tensor var_4120_cast_fp16 = softmax(axis = var_2254, x = aw_247_cast_fp16)[name = tensor("op_4120_cast_fp16")]; tensor var_4121_cast_fp16 = softmax(axis = var_2254, x = aw_249_cast_fp16)[name = tensor("op_4121_cast_fp16")]; tensor var_4122_cast_fp16 = softmax(axis = var_2254, x = aw_251_cast_fp16)[name = tensor("op_4122_cast_fp16")]; tensor var_4123_cast_fp16 = softmax(axis = var_2254, x = aw_253_cast_fp16)[name = tensor("op_4123_cast_fp16")]; tensor var_4124_cast_fp16 = softmax(axis = var_2254, x = aw_255_cast_fp16)[name = tensor("op_4124_cast_fp16")]; tensor var_4125_cast_fp16 = softmax(axis = var_2254, x = aw_257_cast_fp16)[name = tensor("op_4125_cast_fp16")]; tensor var_4126_cast_fp16 = softmax(axis = var_2254, x = aw_259_cast_fp16)[name = tensor("op_4126_cast_fp16")]; tensor var_4127_cast_fp16 = softmax(axis = var_2254, x = aw_261_cast_fp16)[name = tensor("op_4127_cast_fp16")]; tensor var_4128_cast_fp16 = softmax(axis = var_2254, x = aw_263_cast_fp16)[name = tensor("op_4128_cast_fp16")]; tensor var_4129_cast_fp16 = softmax(axis = var_2254, x = aw_265_cast_fp16)[name = tensor("op_4129_cast_fp16")]; tensor var_4130_cast_fp16 = softmax(axis = var_2254, x = aw_267_cast_fp16)[name = tensor("op_4130_cast_fp16")]; tensor var_4131_cast_fp16 = softmax(axis = var_2254, x = aw_269_cast_fp16)[name = tensor("op_4131_cast_fp16")]; tensor var_4132_cast_fp16 = softmax(axis = var_2254, x = aw_271_cast_fp16)[name = tensor("op_4132_cast_fp16")]; tensor var_4133_cast_fp16 = softmax(axis = var_2254, x = aw_273_cast_fp16)[name = tensor("op_4133_cast_fp16")]; tensor var_4134_cast_fp16 = softmax(axis = var_2254, x = aw_275_cast_fp16)[name = tensor("op_4134_cast_fp16")]; tensor var_4135_cast_fp16 = softmax(axis = var_2254, x = aw_277_cast_fp16)[name = tensor("op_4135_cast_fp16")]; tensor var_4136_cast_fp16 = softmax(axis = var_2254, x = aw_279_cast_fp16)[name = tensor("op_4136_cast_fp16")]; tensor var_4138_equation_0 = const()[name = tensor("op_4138_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4138_cast_fp16 = einsum(equation = var_4138_equation_0, values = (var_3958_cast_fp16, var_4117_cast_fp16))[name = tensor("op_4138_cast_fp16")]; tensor var_4140_equation_0 = const()[name = tensor("op_4140_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4140_cast_fp16 = einsum(equation = var_4140_equation_0, values = (var_3962_cast_fp16, var_4118_cast_fp16))[name = tensor("op_4140_cast_fp16")]; tensor var_4142_equation_0 = const()[name = tensor("op_4142_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4142_cast_fp16 = einsum(equation = var_4142_equation_0, values = (var_3966_cast_fp16, var_4119_cast_fp16))[name = tensor("op_4142_cast_fp16")]; tensor var_4144_equation_0 = const()[name = tensor("op_4144_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4144_cast_fp16 = einsum(equation = var_4144_equation_0, values = (var_3970_cast_fp16, var_4120_cast_fp16))[name = tensor("op_4144_cast_fp16")]; tensor var_4146_equation_0 = const()[name = tensor("op_4146_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4146_cast_fp16 = einsum(equation = var_4146_equation_0, values = (var_3974_cast_fp16, var_4121_cast_fp16))[name = tensor("op_4146_cast_fp16")]; tensor var_4148_equation_0 = const()[name = tensor("op_4148_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4148_cast_fp16 = einsum(equation = var_4148_equation_0, values = (var_3978_cast_fp16, var_4122_cast_fp16))[name = tensor("op_4148_cast_fp16")]; tensor var_4150_equation_0 = const()[name = tensor("op_4150_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4150_cast_fp16 = einsum(equation = var_4150_equation_0, values = (var_3982_cast_fp16, var_4123_cast_fp16))[name = tensor("op_4150_cast_fp16")]; tensor var_4152_equation_0 = const()[name = tensor("op_4152_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4152_cast_fp16 = einsum(equation = var_4152_equation_0, values = (var_3986_cast_fp16, var_4124_cast_fp16))[name = tensor("op_4152_cast_fp16")]; tensor var_4154_equation_0 = const()[name = tensor("op_4154_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4154_cast_fp16 = einsum(equation = var_4154_equation_0, values = (var_3990_cast_fp16, var_4125_cast_fp16))[name = tensor("op_4154_cast_fp16")]; tensor var_4156_equation_0 = const()[name = tensor("op_4156_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4156_cast_fp16 = einsum(equation = var_4156_equation_0, values = (var_3994_cast_fp16, var_4126_cast_fp16))[name = tensor("op_4156_cast_fp16")]; tensor var_4158_equation_0 = const()[name = tensor("op_4158_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4158_cast_fp16 = einsum(equation = var_4158_equation_0, values = (var_3998_cast_fp16, var_4127_cast_fp16))[name = tensor("op_4158_cast_fp16")]; tensor var_4160_equation_0 = const()[name = tensor("op_4160_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4160_cast_fp16 = einsum(equation = var_4160_equation_0, values = (var_4002_cast_fp16, var_4128_cast_fp16))[name = tensor("op_4160_cast_fp16")]; tensor var_4162_equation_0 = const()[name = tensor("op_4162_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4162_cast_fp16 = einsum(equation = var_4162_equation_0, values = (var_4006_cast_fp16, var_4129_cast_fp16))[name = tensor("op_4162_cast_fp16")]; tensor var_4164_equation_0 = const()[name = tensor("op_4164_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4164_cast_fp16 = einsum(equation = var_4164_equation_0, values = (var_4010_cast_fp16, var_4130_cast_fp16))[name = tensor("op_4164_cast_fp16")]; tensor var_4166_equation_0 = const()[name = tensor("op_4166_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4166_cast_fp16 = einsum(equation = var_4166_equation_0, values = (var_4014_cast_fp16, var_4131_cast_fp16))[name = tensor("op_4166_cast_fp16")]; tensor var_4168_equation_0 = const()[name = tensor("op_4168_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4168_cast_fp16 = einsum(equation = var_4168_equation_0, values = (var_4018_cast_fp16, var_4132_cast_fp16))[name = tensor("op_4168_cast_fp16")]; tensor var_4170_equation_0 = const()[name = tensor("op_4170_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4170_cast_fp16 = einsum(equation = var_4170_equation_0, values = (var_4022_cast_fp16, var_4133_cast_fp16))[name = tensor("op_4170_cast_fp16")]; tensor var_4172_equation_0 = const()[name = tensor("op_4172_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4172_cast_fp16 = einsum(equation = var_4172_equation_0, values = (var_4026_cast_fp16, var_4134_cast_fp16))[name = tensor("op_4172_cast_fp16")]; tensor var_4174_equation_0 = const()[name = tensor("op_4174_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4174_cast_fp16 = einsum(equation = var_4174_equation_0, values = (var_4030_cast_fp16, var_4135_cast_fp16))[name = tensor("op_4174_cast_fp16")]; tensor var_4176_equation_0 = const()[name = tensor("op_4176_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4176_cast_fp16 = einsum(equation = var_4176_equation_0, values = (var_4034_cast_fp16, var_4136_cast_fp16))[name = tensor("op_4176_cast_fp16")]; tensor input_161_interleave_0 = const()[name = tensor("input_161_interleave_0"), val = tensor(false)]; tensor input_161_cast_fp16 = concat(axis = var_2254, interleave = input_161_interleave_0, values = (var_4138_cast_fp16, var_4140_cast_fp16, var_4142_cast_fp16, var_4144_cast_fp16, var_4146_cast_fp16, var_4148_cast_fp16, var_4150_cast_fp16, var_4152_cast_fp16, var_4154_cast_fp16, var_4156_cast_fp16, var_4158_cast_fp16, var_4160_cast_fp16, var_4162_cast_fp16, var_4164_cast_fp16, var_4166_cast_fp16, var_4168_cast_fp16, var_4170_cast_fp16, var_4172_cast_fp16, var_4174_cast_fp16, var_4176_cast_fp16))[name = tensor("input_161_cast_fp16")]; tensor var_4182 = const()[name = tensor("op_4182"), val = tensor([1, 1])]; tensor var_4184 = const()[name = tensor("op_4184"), val = tensor([1, 1])]; tensor var_4186_pad_type_0 = const()[name = tensor("op_4186_pad_type_0"), val = tensor("custom")]; tensor var_4186_pad_0 = const()[name = tensor("op_4186_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(308004672)))]; tensor down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311281536)))]; tensor var_4186_cast_fp16 = conv(bias = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_4184, groups = var_2254, pad = var_4186_pad_0, pad_type = var_4186_pad_type_0, strides = var_4182, weight = down_blocks_2_attentions_1_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_161_cast_fp16)[name = tensor("op_4186_cast_fp16")]; tensor inputs_35_cast_fp16 = add(x = var_4186_cast_fp16, y = inputs_33_cast_fp16)[name = tensor("inputs_35_cast_fp16")]; tensor var_4190 = const()[name = tensor("op_4190"), val = tensor([1])]; tensor channels_mean_35_cast_fp16 = reduce_mean(axes = var_4190, keep_dims = var_2249, x = inputs_35_cast_fp16)[name = tensor("channels_mean_35_cast_fp16")]; tensor zero_mean_35_cast_fp16 = sub(x = inputs_35_cast_fp16, y = channels_mean_35_cast_fp16)[name = tensor("zero_mean_35_cast_fp16")]; tensor zero_mean_sq_35_cast_fp16 = mul(x = zero_mean_35_cast_fp16, y = zero_mean_35_cast_fp16)[name = tensor("zero_mean_sq_35_cast_fp16")]; tensor var_4194 = const()[name = tensor("op_4194"), val = tensor([1])]; tensor var_4195_cast_fp16 = reduce_mean(axes = var_4194, keep_dims = var_2249, x = zero_mean_sq_35_cast_fp16)[name = tensor("op_4195_cast_fp16")]; tensor var_4196_to_fp16 = const()[name = tensor("op_4196_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4197_cast_fp16 = add(x = var_4195_cast_fp16, y = var_4196_to_fp16)[name = tensor("op_4197_cast_fp16")]; tensor denom_35_epsilon_0_to_fp16 = const()[name = tensor("denom_35_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_35_cast_fp16 = rsqrt(epsilon = denom_35_epsilon_0_to_fp16, x = var_4197_cast_fp16)[name = tensor("denom_35_cast_fp16")]; tensor out_35_cast_fp16 = mul(x = zero_mean_35_cast_fp16, y = denom_35_cast_fp16)[name = tensor("out_35_cast_fp16")]; tensor var_4201_to_fp16 = const()[name = tensor("op_4201_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311284160)))]; tensor var_4202_cast_fp16 = add(x = out_35_cast_fp16, y = var_4201_to_fp16)[name = tensor("op_4202_cast_fp16")]; tensor var_4204_to_fp16 = const()[name = tensor("op_4204_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311286784)))]; tensor input_163_cast_fp16 = mul(x = var_4202_cast_fp16, y = var_4204_to_fp16)[name = tensor("input_163_cast_fp16")]; tensor var_4212 = const()[name = tensor("op_4212"), val = tensor([1, 1])]; tensor var_4214 = const()[name = tensor("op_4214"), val = tensor([1, 1])]; tensor var_4216_pad_type_0 = const()[name = tensor("op_4216_pad_type_0"), val = tensor("custom")]; tensor var_4216_pad_0 = const()[name = tensor("op_4216_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(311289408)))]; tensor down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337503872)))]; tensor var_4216_cast_fp16 = conv(bias = down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_4214, groups = var_2254, pad = var_4216_pad_0, pad_type = var_4216_pad_type_0, strides = var_4212, weight = down_blocks_2_attentions_1_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_163_cast_fp16)[name = tensor("op_4216_cast_fp16")]; tensor var_4217_split_sizes_0 = const()[name = tensor("op_4217_split_sizes_0"), val = tensor([5120, 5120])]; tensor var_4217_axis_0 = const()[name = tensor("op_4217_axis_0"), val = tensor(1)]; tensor var_4217_cast_fp16_0, tensor var_4217_cast_fp16_1 = split(axis = var_4217_axis_0, split_sizes = var_4217_split_sizes_0, x = var_4216_cast_fp16)[name = tensor("op_4217_cast_fp16")]; tensor var_4219_mode_0 = const()[name = tensor("op_4219_mode_0"), val = tensor("EXACT")]; tensor var_4219_cast_fp16 = gelu(mode = var_4219_mode_0, x = var_4217_cast_fp16_1)[name = tensor("op_4219_cast_fp16")]; tensor input_165_cast_fp16 = mul(x = var_4217_cast_fp16_0, y = var_4219_cast_fp16)[name = tensor("input_165_cast_fp16")]; tensor var_4223 = const()[name = tensor("op_4223"), val = tensor([1, 1])]; tensor var_4225 = const()[name = tensor("op_4225"), val = tensor([1, 1])]; tensor var_4227_pad_type_0 = const()[name = tensor("op_4227_pad_type_0"), val = tensor("custom")]; tensor var_4227_pad_0 = const()[name = tensor("op_4227_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337524416)))]; tensor down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350631680)))]; tensor var_4227_cast_fp16 = conv(bias = down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_4225, groups = var_2254, pad = var_4227_pad_0, pad_type = var_4227_pad_type_0, strides = var_4223, weight = down_blocks_2_attentions_1_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_165_cast_fp16)[name = tensor("op_4227_cast_fp16")]; tensor hidden_states_105_cast_fp16 = add(x = var_4227_cast_fp16, y = inputs_35_cast_fp16)[name = tensor("hidden_states_105_cast_fp16")]; tensor var_4229 = const()[name = tensor("op_4229"), val = tensor([2, 1280, 12, 12])]; tensor input_167_cast_fp16 = reshape(shape = var_4229, x = hidden_states_105_cast_fp16)[name = tensor("input_167_cast_fp16")]; tensor var_4233 = const()[name = tensor("op_4233"), val = tensor([1, 1])]; tensor var_4235 = const()[name = tensor("op_4235"), val = tensor([1, 1])]; tensor hidden_states_107_pad_type_0 = const()[name = tensor("hidden_states_107_pad_type_0"), val = tensor("custom")]; tensor hidden_states_107_pad_0 = const()[name = tensor("hidden_states_107_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_2_attentions_1_proj_out_weight_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(350634304)))]; tensor down_blocks_2_attentions_1_proj_out_bias_to_fp16 = const()[name = tensor("down_blocks_2_attentions_1_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353911168)))]; tensor hidden_states_107_cast_fp16 = conv(bias = down_blocks_2_attentions_1_proj_out_bias_to_fp16, dilations = var_4235, groups = var_2254, pad = hidden_states_107_pad_0, pad_type = hidden_states_107_pad_type_0, strides = var_4233, weight = down_blocks_2_attentions_1_proj_out_weight_to_fp16, x = input_167_cast_fp16)[name = tensor("hidden_states_107_cast_fp16")]; tensor input_169_cast_fp16_1 = add(x = hidden_states_107_cast_fp16, y = hidden_states_95_cast_fp16)[name = tensor("input_169_cast_fp16")]; tensor var_4242 = const()[name = tensor("op_4242"), val = tensor([2, 2])]; tensor var_4244 = const()[name = tensor("op_4244"), val = tensor([1, 1])]; tensor input_171_pad_type_0 = const()[name = tensor("input_171_pad_type_0"), val = tensor("custom")]; tensor input_171_pad_0 = const()[name = tensor("input_171_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_2_downsamplers_0_conv_weight_to_fp16 = const()[name = tensor("down_blocks_2_downsamplers_0_conv_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(353913792)))]; tensor down_blocks_2_downsamplers_0_conv_bias_to_fp16 = const()[name = tensor("down_blocks_2_downsamplers_0_conv_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383405056)))]; tensor input_171_cast_fp16_1 = conv(bias = down_blocks_2_downsamplers_0_conv_bias_to_fp16, dilations = var_4244, groups = var_2254, pad = input_171_pad_0, pad_type = input_171_pad_type_0, strides = var_4242, weight = down_blocks_2_downsamplers_0_conv_weight_to_fp16, x = input_169_cast_fp16_1)[name = tensor("input_171_cast_fp16")]; tensor var_4256 = const()[name = tensor("op_4256"), val = tensor(1)]; tensor reshape_72_shape_0 = const()[name = tensor("reshape_72_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_72_cast_fp16 = reshape(shape = reshape_72_shape_0, x = input_171_cast_fp16_1)[name = tensor("reshape_72_cast_fp16")]; tensor reduce_mean_54_axes_0 = const()[name = tensor("reduce_mean_54_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_54_keep_dims_0 = const()[name = tensor("reduce_mean_54_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_54_cast_fp16 = reduce_mean(axes = reduce_mean_54_axes_0, keep_dims = reduce_mean_54_keep_dims_0, x = reshape_72_cast_fp16)[name = tensor("reduce_mean_54_cast_fp16")]; tensor sub_36_cast_fp16 = sub(x = reshape_72_cast_fp16, y = reduce_mean_54_cast_fp16)[name = tensor("sub_36_cast_fp16")]; tensor square_18_cast_fp16 = square(x = sub_36_cast_fp16)[name = tensor("square_18_cast_fp16")]; tensor reduce_mean_56_axes_0 = const()[name = tensor("reduce_mean_56_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_56_keep_dims_0 = const()[name = tensor("reduce_mean_56_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_56_cast_fp16 = reduce_mean(axes = reduce_mean_56_axes_0, keep_dims = reduce_mean_56_keep_dims_0, x = square_18_cast_fp16)[name = tensor("reduce_mean_56_cast_fp16")]; tensor add_36_y_0_to_fp16 = const()[name = tensor("add_36_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_36_cast_fp16 = add(x = reduce_mean_56_cast_fp16, y = add_36_y_0_to_fp16)[name = tensor("add_36_cast_fp16")]; tensor sqrt_18_cast_fp16 = sqrt(x = add_36_cast_fp16)[name = tensor("sqrt_18_cast_fp16")]; tensor real_div_18_cast_fp16 = real_div(x = sub_36_cast_fp16, y = sqrt_18_cast_fp16)[name = tensor("real_div_18_cast_fp16")]; tensor reshape_73_shape_0 = const()[name = tensor("reshape_73_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_73_cast_fp16 = reshape(shape = reshape_73_shape_0, x = real_div_18_cast_fp16)[name = tensor("reshape_73_cast_fp16")]; tensor add_37_gamma_0_to_fp16 = const()[name = tensor("add_37_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383407680)))]; tensor add_37_beta_0_to_fp16 = const()[name = tensor("add_37_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383410304)))]; tensor add_37_epsilon_0_to_fp16 = const()[name = tensor("add_37_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_37_cast_fp16 = batch_norm(beta = add_37_beta_0_to_fp16, epsilon = add_37_epsilon_0_to_fp16, gamma = add_37_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_73_cast_fp16)[name = tensor("add_37_cast_fp16")]; tensor input_175_cast_fp16 = silu(x = add_37_cast_fp16)[name = tensor("input_175_cast_fp16")]; tensor var_4272 = const()[name = tensor("op_4272"), val = tensor([1, 1])]; tensor var_4274 = const()[name = tensor("op_4274"), val = tensor([1, 1])]; tensor hidden_states_109_pad_type_0 = const()[name = tensor("hidden_states_109_pad_type_0"), val = tensor("custom")]; tensor hidden_states_109_pad_0 = const()[name = tensor("hidden_states_109_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_3_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(383412928)))]; tensor down_blocks_3_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412904192)))]; tensor hidden_states_109_cast_fp16 = conv(bias = down_blocks_3_resnets_0_conv1_bias_to_fp16, dilations = var_4274, groups = var_4256, pad = hidden_states_109_pad_0, pad_type = hidden_states_109_pad_type_0, strides = var_4272, weight = down_blocks_3_resnets_0_conv1_weight_to_fp16, x = input_175_cast_fp16)[name = tensor("hidden_states_109_cast_fp16")]; tensor var_4280 = const()[name = tensor("op_4280"), val = tensor([1, 1])]; tensor var_4282 = const()[name = tensor("op_4282"), val = tensor([1, 1])]; tensor temb_13_pad_type_0 = const()[name = tensor("temb_13_pad_type_0"), val = tensor("custom")]; tensor temb_13_pad_0 = const()[name = tensor("temb_13_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_3_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412906816)))]; tensor down_blocks_3_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416183680)))]; tensor temb_13_cast_fp16 = conv(bias = down_blocks_3_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_4282, groups = var_4256, pad = temb_13_pad_0, pad_type = temb_13_pad_type_0, strides = var_4280, weight = down_blocks_3_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_13_cast_fp16")]; tensor input_179_cast_fp16 = add(x = hidden_states_109_cast_fp16, y = temb_13_cast_fp16)[name = tensor("input_179_cast_fp16")]; tensor reshape_76_shape_0 = const()[name = tensor("reshape_76_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_76_cast_fp16 = reshape(shape = reshape_76_shape_0, x = input_179_cast_fp16)[name = tensor("reshape_76_cast_fp16")]; tensor reduce_mean_57_axes_0 = const()[name = tensor("reduce_mean_57_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_57_keep_dims_0 = const()[name = tensor("reduce_mean_57_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_57_cast_fp16 = reduce_mean(axes = reduce_mean_57_axes_0, keep_dims = reduce_mean_57_keep_dims_0, x = reshape_76_cast_fp16)[name = tensor("reduce_mean_57_cast_fp16")]; tensor sub_38_cast_fp16 = sub(x = reshape_76_cast_fp16, y = reduce_mean_57_cast_fp16)[name = tensor("sub_38_cast_fp16")]; tensor square_19_cast_fp16 = square(x = sub_38_cast_fp16)[name = tensor("square_19_cast_fp16")]; tensor reduce_mean_59_axes_0 = const()[name = tensor("reduce_mean_59_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_59_keep_dims_0 = const()[name = tensor("reduce_mean_59_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_59_cast_fp16 = reduce_mean(axes = reduce_mean_59_axes_0, keep_dims = reduce_mean_59_keep_dims_0, x = square_19_cast_fp16)[name = tensor("reduce_mean_59_cast_fp16")]; tensor add_38_y_0_to_fp16 = const()[name = tensor("add_38_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_38_cast_fp16 = add(x = reduce_mean_59_cast_fp16, y = add_38_y_0_to_fp16)[name = tensor("add_38_cast_fp16")]; tensor sqrt_19_cast_fp16 = sqrt(x = add_38_cast_fp16)[name = tensor("sqrt_19_cast_fp16")]; tensor real_div_19_cast_fp16 = real_div(x = sub_38_cast_fp16, y = sqrt_19_cast_fp16)[name = tensor("real_div_19_cast_fp16")]; tensor reshape_77_shape_0 = const()[name = tensor("reshape_77_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_77_cast_fp16 = reshape(shape = reshape_77_shape_0, x = real_div_19_cast_fp16)[name = tensor("reshape_77_cast_fp16")]; tensor add_39_gamma_0_to_fp16 = const()[name = tensor("add_39_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416186304)))]; tensor add_39_beta_0_to_fp16 = const()[name = tensor("add_39_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416188928)))]; tensor add_39_epsilon_0_to_fp16 = const()[name = tensor("add_39_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_39_cast_fp16 = batch_norm(beta = add_39_beta_0_to_fp16, epsilon = add_39_epsilon_0_to_fp16, gamma = add_39_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_77_cast_fp16)[name = tensor("add_39_cast_fp16")]; tensor input_183_cast_fp16 = silu(x = add_39_cast_fp16)[name = tensor("input_183_cast_fp16")]; tensor var_4292 = const()[name = tensor("op_4292"), val = tensor([1, 1])]; tensor var_4294 = const()[name = tensor("op_4294"), val = tensor([1, 1])]; tensor hidden_states_111_pad_type_0 = const()[name = tensor("hidden_states_111_pad_type_0"), val = tensor("custom")]; tensor hidden_states_111_pad_0 = const()[name = tensor("hidden_states_111_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_3_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(416191552)))]; tensor down_blocks_3_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445682816)))]; tensor hidden_states_111_cast_fp16 = conv(bias = down_blocks_3_resnets_0_conv2_bias_to_fp16, dilations = var_4294, groups = var_4256, pad = hidden_states_111_pad_0, pad_type = hidden_states_111_pad_type_0, strides = var_4292, weight = down_blocks_3_resnets_0_conv2_weight_to_fp16, x = input_183_cast_fp16)[name = tensor("hidden_states_111_cast_fp16")]; tensor input_185_cast_fp16 = add(x = input_171_cast_fp16_1, y = hidden_states_111_cast_fp16)[name = tensor("input_185_cast_fp16")]; tensor reshape_80_shape_0 = const()[name = tensor("reshape_80_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_80_cast_fp16 = reshape(shape = reshape_80_shape_0, x = input_185_cast_fp16)[name = tensor("reshape_80_cast_fp16")]; tensor reduce_mean_60_axes_0 = const()[name = tensor("reduce_mean_60_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_60_keep_dims_0 = const()[name = tensor("reduce_mean_60_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_60_cast_fp16 = reduce_mean(axes = reduce_mean_60_axes_0, keep_dims = reduce_mean_60_keep_dims_0, x = reshape_80_cast_fp16)[name = tensor("reduce_mean_60_cast_fp16")]; tensor sub_40_cast_fp16 = sub(x = reshape_80_cast_fp16, y = reduce_mean_60_cast_fp16)[name = tensor("sub_40_cast_fp16")]; tensor square_20_cast_fp16 = square(x = sub_40_cast_fp16)[name = tensor("square_20_cast_fp16")]; tensor reduce_mean_62_axes_0 = const()[name = tensor("reduce_mean_62_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_62_keep_dims_0 = const()[name = tensor("reduce_mean_62_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_62_cast_fp16 = reduce_mean(axes = reduce_mean_62_axes_0, keep_dims = reduce_mean_62_keep_dims_0, x = square_20_cast_fp16)[name = tensor("reduce_mean_62_cast_fp16")]; tensor add_40_y_0_to_fp16 = const()[name = tensor("add_40_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_40_cast_fp16 = add(x = reduce_mean_62_cast_fp16, y = add_40_y_0_to_fp16)[name = tensor("add_40_cast_fp16")]; tensor sqrt_20_cast_fp16 = sqrt(x = add_40_cast_fp16)[name = tensor("sqrt_20_cast_fp16")]; tensor real_div_20_cast_fp16 = real_div(x = sub_40_cast_fp16, y = sqrt_20_cast_fp16)[name = tensor("real_div_20_cast_fp16")]; tensor reshape_81_shape_0 = const()[name = tensor("reshape_81_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_81_cast_fp16 = reshape(shape = reshape_81_shape_0, x = real_div_20_cast_fp16)[name = tensor("reshape_81_cast_fp16")]; tensor add_41_gamma_0_to_fp16 = const()[name = tensor("add_41_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445685440)))]; tensor add_41_beta_0_to_fp16 = const()[name = tensor("add_41_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445688064)))]; tensor add_41_epsilon_0_to_fp16 = const()[name = tensor("add_41_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_41_cast_fp16 = batch_norm(beta = add_41_beta_0_to_fp16, epsilon = add_41_epsilon_0_to_fp16, gamma = add_41_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_81_cast_fp16)[name = tensor("add_41_cast_fp16")]; tensor input_189_cast_fp16 = silu(x = add_41_cast_fp16)[name = tensor("input_189_cast_fp16")]; tensor var_4309 = const()[name = tensor("op_4309"), val = tensor([1, 1])]; tensor var_4311 = const()[name = tensor("op_4311"), val = tensor([1, 1])]; tensor hidden_states_113_pad_type_0 = const()[name = tensor("hidden_states_113_pad_type_0"), val = tensor("custom")]; tensor hidden_states_113_pad_0 = const()[name = tensor("hidden_states_113_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_3_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(445690688)))]; tensor down_blocks_3_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(475181952)))]; tensor hidden_states_113_cast_fp16 = conv(bias = down_blocks_3_resnets_1_conv1_bias_to_fp16, dilations = var_4311, groups = var_4256, pad = hidden_states_113_pad_0, pad_type = hidden_states_113_pad_type_0, strides = var_4309, weight = down_blocks_3_resnets_1_conv1_weight_to_fp16, x = input_189_cast_fp16)[name = tensor("hidden_states_113_cast_fp16")]; tensor var_4317 = const()[name = tensor("op_4317"), val = tensor([1, 1])]; tensor var_4319 = const()[name = tensor("op_4319"), val = tensor([1, 1])]; tensor temb_15_pad_type_0 = const()[name = tensor("temb_15_pad_type_0"), val = tensor("custom")]; tensor temb_15_pad_0 = const()[name = tensor("temb_15_pad_0"), val = tensor([0, 0, 0, 0])]; tensor down_blocks_3_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(475184576)))]; tensor down_blocks_3_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478461440)))]; tensor temb_15_cast_fp16 = conv(bias = down_blocks_3_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_4319, groups = var_4256, pad = temb_15_pad_0, pad_type = temb_15_pad_type_0, strides = var_4317, weight = down_blocks_3_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_15_cast_fp16")]; tensor input_193_cast_fp16 = add(x = hidden_states_113_cast_fp16, y = temb_15_cast_fp16)[name = tensor("input_193_cast_fp16")]; tensor reshape_84_shape_0 = const()[name = tensor("reshape_84_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_84_cast_fp16 = reshape(shape = reshape_84_shape_0, x = input_193_cast_fp16)[name = tensor("reshape_84_cast_fp16")]; tensor reduce_mean_63_axes_0 = const()[name = tensor("reduce_mean_63_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_63_keep_dims_0 = const()[name = tensor("reduce_mean_63_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_63_cast_fp16 = reduce_mean(axes = reduce_mean_63_axes_0, keep_dims = reduce_mean_63_keep_dims_0, x = reshape_84_cast_fp16)[name = tensor("reduce_mean_63_cast_fp16")]; tensor sub_42_cast_fp16 = sub(x = reshape_84_cast_fp16, y = reduce_mean_63_cast_fp16)[name = tensor("sub_42_cast_fp16")]; tensor square_21_cast_fp16 = square(x = sub_42_cast_fp16)[name = tensor("square_21_cast_fp16")]; tensor reduce_mean_65_axes_0 = const()[name = tensor("reduce_mean_65_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_65_keep_dims_0 = const()[name = tensor("reduce_mean_65_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_65_cast_fp16 = reduce_mean(axes = reduce_mean_65_axes_0, keep_dims = reduce_mean_65_keep_dims_0, x = square_21_cast_fp16)[name = tensor("reduce_mean_65_cast_fp16")]; tensor add_42_y_0_to_fp16 = const()[name = tensor("add_42_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_42_cast_fp16 = add(x = reduce_mean_65_cast_fp16, y = add_42_y_0_to_fp16)[name = tensor("add_42_cast_fp16")]; tensor sqrt_21_cast_fp16 = sqrt(x = add_42_cast_fp16)[name = tensor("sqrt_21_cast_fp16")]; tensor real_div_21_cast_fp16 = real_div(x = sub_42_cast_fp16, y = sqrt_21_cast_fp16)[name = tensor("real_div_21_cast_fp16")]; tensor reshape_85_shape_0 = const()[name = tensor("reshape_85_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_85_cast_fp16 = reshape(shape = reshape_85_shape_0, x = real_div_21_cast_fp16)[name = tensor("reshape_85_cast_fp16")]; tensor add_43_gamma_0_to_fp16 = const()[name = tensor("add_43_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478464064)))]; tensor add_43_beta_0_to_fp16 = const()[name = tensor("add_43_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478466688)))]; tensor add_43_epsilon_0_to_fp16 = const()[name = tensor("add_43_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_43_cast_fp16 = batch_norm(beta = add_43_beta_0_to_fp16, epsilon = add_43_epsilon_0_to_fp16, gamma = add_43_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_85_cast_fp16)[name = tensor("add_43_cast_fp16")]; tensor input_197_cast_fp16 = silu(x = add_43_cast_fp16)[name = tensor("input_197_cast_fp16")]; tensor var_4329 = const()[name = tensor("op_4329"), val = tensor([1, 1])]; tensor var_4331 = const()[name = tensor("op_4331"), val = tensor([1, 1])]; tensor hidden_states_115_pad_type_0 = const()[name = tensor("hidden_states_115_pad_type_0"), val = tensor("custom")]; tensor hidden_states_115_pad_0 = const()[name = tensor("hidden_states_115_pad_0"), val = tensor([1, 1, 1, 1])]; tensor down_blocks_3_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(478469312)))]; tensor down_blocks_3_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("down_blocks_3_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507960576)))]; tensor hidden_states_115_cast_fp16 = conv(bias = down_blocks_3_resnets_1_conv2_bias_to_fp16, dilations = var_4331, groups = var_4256, pad = hidden_states_115_pad_0, pad_type = hidden_states_115_pad_type_0, strides = var_4329, weight = down_blocks_3_resnets_1_conv2_weight_to_fp16, x = input_197_cast_fp16)[name = tensor("hidden_states_115_cast_fp16")]; tensor input_199_cast_fp16 = add(x = input_185_cast_fp16, y = hidden_states_115_cast_fp16)[name = tensor("input_199_cast_fp16")]; tensor var_4366 = const()[name = tensor("op_4366"), val = tensor(true)]; tensor var_4371 = const()[name = tensor("op_4371"), val = tensor(1)]; tensor reshape_88_shape_0 = const()[name = tensor("reshape_88_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_88_cast_fp16 = reshape(shape = reshape_88_shape_0, x = input_199_cast_fp16)[name = tensor("reshape_88_cast_fp16")]; tensor reduce_mean_66_axes_0 = const()[name = tensor("reduce_mean_66_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_66_keep_dims_0 = const()[name = tensor("reduce_mean_66_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_66_cast_fp16 = reduce_mean(axes = reduce_mean_66_axes_0, keep_dims = reduce_mean_66_keep_dims_0, x = reshape_88_cast_fp16)[name = tensor("reduce_mean_66_cast_fp16")]; tensor sub_44_cast_fp16 = sub(x = reshape_88_cast_fp16, y = reduce_mean_66_cast_fp16)[name = tensor("sub_44_cast_fp16")]; tensor square_22_cast_fp16 = square(x = sub_44_cast_fp16)[name = tensor("square_22_cast_fp16")]; tensor reduce_mean_68_axes_0 = const()[name = tensor("reduce_mean_68_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_68_keep_dims_0 = const()[name = tensor("reduce_mean_68_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_68_cast_fp16 = reduce_mean(axes = reduce_mean_68_axes_0, keep_dims = reduce_mean_68_keep_dims_0, x = square_22_cast_fp16)[name = tensor("reduce_mean_68_cast_fp16")]; tensor add_44_y_0_to_fp16 = const()[name = tensor("add_44_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_44_cast_fp16 = add(x = reduce_mean_68_cast_fp16, y = add_44_y_0_to_fp16)[name = tensor("add_44_cast_fp16")]; tensor sqrt_22_cast_fp16 = sqrt(x = add_44_cast_fp16)[name = tensor("sqrt_22_cast_fp16")]; tensor real_div_22_cast_fp16 = real_div(x = sub_44_cast_fp16, y = sqrt_22_cast_fp16)[name = tensor("real_div_22_cast_fp16")]; tensor reshape_89_shape_0 = const()[name = tensor("reshape_89_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_89_cast_fp16 = reshape(shape = reshape_89_shape_0, x = real_div_22_cast_fp16)[name = tensor("reshape_89_cast_fp16")]; tensor add_45_gamma_0_to_fp16 = const()[name = tensor("add_45_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507963200)))]; tensor add_45_beta_0_to_fp16 = const()[name = tensor("add_45_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507965824)))]; tensor add_45_epsilon_0_to_fp16 = const()[name = tensor("add_45_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_45_cast_fp16 = batch_norm(beta = add_45_beta_0_to_fp16, epsilon = add_45_epsilon_0_to_fp16, gamma = add_45_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_89_cast_fp16)[name = tensor("add_45_cast_fp16")]; tensor input_203_cast_fp16 = silu(x = add_45_cast_fp16)[name = tensor("input_203_cast_fp16")]; tensor var_4389 = const()[name = tensor("op_4389"), val = tensor([1, 1])]; tensor var_4391 = const()[name = tensor("op_4391"), val = tensor([1, 1])]; tensor hidden_states_117_pad_type_0 = const()[name = tensor("hidden_states_117_pad_type_0"), val = tensor("custom")]; tensor hidden_states_117_pad_0 = const()[name = tensor("hidden_states_117_pad_0"), val = tensor([1, 1, 1, 1])]; tensor mid_block_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("mid_block_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(507968448)))]; tensor mid_block_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("mid_block_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537459712)))]; tensor hidden_states_117_cast_fp16 = conv(bias = mid_block_resnets_0_conv1_bias_to_fp16, dilations = var_4391, groups = var_4371, pad = hidden_states_117_pad_0, pad_type = hidden_states_117_pad_type_0, strides = var_4389, weight = mid_block_resnets_0_conv1_weight_to_fp16, x = input_203_cast_fp16)[name = tensor("hidden_states_117_cast_fp16")]; tensor var_4397 = const()[name = tensor("op_4397"), val = tensor([1, 1])]; tensor var_4399 = const()[name = tensor("op_4399"), val = tensor([1, 1])]; tensor temb_17_pad_type_0 = const()[name = tensor("temb_17_pad_type_0"), val = tensor("custom")]; tensor temb_17_pad_0 = const()[name = tensor("temb_17_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("mid_block_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(537462336)))]; tensor mid_block_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("mid_block_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540739200)))]; tensor temb_17_cast_fp16 = conv(bias = mid_block_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_4399, groups = var_4371, pad = temb_17_pad_0, pad_type = temb_17_pad_type_0, strides = var_4397, weight = mid_block_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_17_cast_fp16")]; tensor input_207_cast_fp16 = add(x = hidden_states_117_cast_fp16, y = temb_17_cast_fp16)[name = tensor("input_207_cast_fp16")]; tensor reshape_92_shape_0 = const()[name = tensor("reshape_92_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_92_cast_fp16 = reshape(shape = reshape_92_shape_0, x = input_207_cast_fp16)[name = tensor("reshape_92_cast_fp16")]; tensor reduce_mean_69_axes_0 = const()[name = tensor("reduce_mean_69_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_69_keep_dims_0 = const()[name = tensor("reduce_mean_69_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_69_cast_fp16 = reduce_mean(axes = reduce_mean_69_axes_0, keep_dims = reduce_mean_69_keep_dims_0, x = reshape_92_cast_fp16)[name = tensor("reduce_mean_69_cast_fp16")]; tensor sub_46_cast_fp16 = sub(x = reshape_92_cast_fp16, y = reduce_mean_69_cast_fp16)[name = tensor("sub_46_cast_fp16")]; tensor square_23_cast_fp16 = square(x = sub_46_cast_fp16)[name = tensor("square_23_cast_fp16")]; tensor reduce_mean_71_axes_0 = const()[name = tensor("reduce_mean_71_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_71_keep_dims_0 = const()[name = tensor("reduce_mean_71_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_71_cast_fp16 = reduce_mean(axes = reduce_mean_71_axes_0, keep_dims = reduce_mean_71_keep_dims_0, x = square_23_cast_fp16)[name = tensor("reduce_mean_71_cast_fp16")]; tensor add_46_y_0_to_fp16 = const()[name = tensor("add_46_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_46_cast_fp16 = add(x = reduce_mean_71_cast_fp16, y = add_46_y_0_to_fp16)[name = tensor("add_46_cast_fp16")]; tensor sqrt_23_cast_fp16 = sqrt(x = add_46_cast_fp16)[name = tensor("sqrt_23_cast_fp16")]; tensor real_div_23_cast_fp16 = real_div(x = sub_46_cast_fp16, y = sqrt_23_cast_fp16)[name = tensor("real_div_23_cast_fp16")]; tensor reshape_93_shape_0 = const()[name = tensor("reshape_93_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_93_cast_fp16 = reshape(shape = reshape_93_shape_0, x = real_div_23_cast_fp16)[name = tensor("reshape_93_cast_fp16")]; tensor add_47_gamma_0_to_fp16 = const()[name = tensor("add_47_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540741824)))]; tensor add_47_beta_0_to_fp16 = const()[name = tensor("add_47_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540744448)))]; tensor add_47_epsilon_0_to_fp16 = const()[name = tensor("add_47_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_47_cast_fp16 = batch_norm(beta = add_47_beta_0_to_fp16, epsilon = add_47_epsilon_0_to_fp16, gamma = add_47_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_93_cast_fp16)[name = tensor("add_47_cast_fp16")]; tensor input_211_cast_fp16 = silu(x = add_47_cast_fp16)[name = tensor("input_211_cast_fp16")]; tensor var_4409 = const()[name = tensor("op_4409"), val = tensor([1, 1])]; tensor var_4411 = const()[name = tensor("op_4411"), val = tensor([1, 1])]; tensor hidden_states_119_pad_type_0 = const()[name = tensor("hidden_states_119_pad_type_0"), val = tensor("custom")]; tensor hidden_states_119_pad_0 = const()[name = tensor("hidden_states_119_pad_0"), val = tensor([1, 1, 1, 1])]; tensor mid_block_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("mid_block_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(540747072)))]; tensor mid_block_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("mid_block_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570238336)))]; tensor hidden_states_119_cast_fp16 = conv(bias = mid_block_resnets_0_conv2_bias_to_fp16, dilations = var_4411, groups = var_4371, pad = hidden_states_119_pad_0, pad_type = hidden_states_119_pad_type_0, strides = var_4409, weight = mid_block_resnets_0_conv2_weight_to_fp16, x = input_211_cast_fp16)[name = tensor("hidden_states_119_cast_fp16")]; tensor hidden_states_121_cast_fp16 = add(x = input_199_cast_fp16, y = hidden_states_119_cast_fp16)[name = tensor("hidden_states_121_cast_fp16")]; tensor reshape_96_shape_0 = const()[name = tensor("reshape_96_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_96_cast_fp16 = reshape(shape = reshape_96_shape_0, x = hidden_states_121_cast_fp16)[name = tensor("reshape_96_cast_fp16")]; tensor reduce_mean_72_axes_0 = const()[name = tensor("reduce_mean_72_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_72_keep_dims_0 = const()[name = tensor("reduce_mean_72_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_72_cast_fp16 = reduce_mean(axes = reduce_mean_72_axes_0, keep_dims = reduce_mean_72_keep_dims_0, x = reshape_96_cast_fp16)[name = tensor("reduce_mean_72_cast_fp16")]; tensor sub_48_cast_fp16 = sub(x = reshape_96_cast_fp16, y = reduce_mean_72_cast_fp16)[name = tensor("sub_48_cast_fp16")]; tensor square_24_cast_fp16 = square(x = sub_48_cast_fp16)[name = tensor("square_24_cast_fp16")]; tensor reduce_mean_74_axes_0 = const()[name = tensor("reduce_mean_74_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_74_keep_dims_0 = const()[name = tensor("reduce_mean_74_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_74_cast_fp16 = reduce_mean(axes = reduce_mean_74_axes_0, keep_dims = reduce_mean_74_keep_dims_0, x = square_24_cast_fp16)[name = tensor("reduce_mean_74_cast_fp16")]; tensor add_48_y_0_to_fp16 = const()[name = tensor("add_48_y_0_to_fp16"), val = tensor(0x1.1p-20)]; tensor add_48_cast_fp16 = add(x = reduce_mean_74_cast_fp16, y = add_48_y_0_to_fp16)[name = tensor("add_48_cast_fp16")]; tensor sqrt_24_cast_fp16 = sqrt(x = add_48_cast_fp16)[name = tensor("sqrt_24_cast_fp16")]; tensor real_div_24_cast_fp16 = real_div(x = sub_48_cast_fp16, y = sqrt_24_cast_fp16)[name = tensor("real_div_24_cast_fp16")]; tensor reshape_97_shape_0 = const()[name = tensor("reshape_97_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_97_cast_fp16 = reshape(shape = reshape_97_shape_0, x = real_div_24_cast_fp16)[name = tensor("reshape_97_cast_fp16")]; tensor add_49_gamma_0_to_fp16 = const()[name = tensor("add_49_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570240960)))]; tensor add_49_beta_0_to_fp16 = const()[name = tensor("add_49_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570243584)))]; tensor add_49_epsilon_0_to_fp16 = const()[name = tensor("add_49_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_49_cast_fp16 = batch_norm(beta = add_49_beta_0_to_fp16, epsilon = add_49_epsilon_0_to_fp16, gamma = add_49_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_97_cast_fp16)[name = tensor("add_49_cast_fp16")]; tensor var_4431 = const()[name = tensor("op_4431"), val = tensor([1, 1])]; tensor var_4433 = const()[name = tensor("op_4433"), val = tensor([1, 1])]; tensor hidden_states_123_pad_type_0 = const()[name = tensor("hidden_states_123_pad_type_0"), val = tensor("custom")]; tensor hidden_states_123_pad_0 = const()[name = tensor("hidden_states_123_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_proj_in_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_proj_in_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570246208)))]; tensor mid_block_attentions_0_proj_in_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_proj_in_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(573523072)))]; tensor hidden_states_123_cast_fp16 = conv(bias = mid_block_attentions_0_proj_in_bias_to_fp16, dilations = var_4433, groups = var_4371, pad = hidden_states_123_pad_0, pad_type = hidden_states_123_pad_type_0, strides = var_4431, weight = mid_block_attentions_0_proj_in_weight_to_fp16, x = add_49_cast_fp16)[name = tensor("hidden_states_123_cast_fp16")]; tensor var_4438 = const()[name = tensor("op_4438"), val = tensor([2, 1280, 1, 36])]; tensor inputs_37_cast_fp16 = reshape(shape = var_4438, x = hidden_states_123_cast_fp16)[name = tensor("inputs_37_cast_fp16")]; tensor var_4448 = const()[name = tensor("op_4448"), val = tensor([1])]; tensor channels_mean_37_cast_fp16 = reduce_mean(axes = var_4448, keep_dims = var_4366, x = inputs_37_cast_fp16)[name = tensor("channels_mean_37_cast_fp16")]; tensor zero_mean_37_cast_fp16 = sub(x = inputs_37_cast_fp16, y = channels_mean_37_cast_fp16)[name = tensor("zero_mean_37_cast_fp16")]; tensor zero_mean_sq_37_cast_fp16 = mul(x = zero_mean_37_cast_fp16, y = zero_mean_37_cast_fp16)[name = tensor("zero_mean_sq_37_cast_fp16")]; tensor var_4452 = const()[name = tensor("op_4452"), val = tensor([1])]; tensor var_4453_cast_fp16 = reduce_mean(axes = var_4452, keep_dims = var_4366, x = zero_mean_sq_37_cast_fp16)[name = tensor("op_4453_cast_fp16")]; tensor var_4454_to_fp16 = const()[name = tensor("op_4454_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4455_cast_fp16 = add(x = var_4453_cast_fp16, y = var_4454_to_fp16)[name = tensor("op_4455_cast_fp16")]; tensor denom_37_epsilon_0_to_fp16 = const()[name = tensor("denom_37_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_37_cast_fp16 = rsqrt(epsilon = denom_37_epsilon_0_to_fp16, x = var_4455_cast_fp16)[name = tensor("denom_37_cast_fp16")]; tensor out_37_cast_fp16 = mul(x = zero_mean_37_cast_fp16, y = denom_37_cast_fp16)[name = tensor("out_37_cast_fp16")]; tensor var_4459_to_fp16 = const()[name = tensor("op_4459_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(573525696)))]; tensor var_4460_cast_fp16 = add(x = out_37_cast_fp16, y = var_4459_to_fp16)[name = tensor("op_4460_cast_fp16")]; tensor var_4462_to_fp16 = const()[name = tensor("op_4462_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(573528320)))]; tensor hidden_states_125_cast_fp16 = mul(x = var_4460_cast_fp16, y = var_4462_to_fp16)[name = tensor("hidden_states_125_cast_fp16")]; tensor var_4469 = const()[name = tensor("op_4469"), val = tensor([1, 1])]; tensor var_4471 = const()[name = tensor("op_4471"), val = tensor([1, 1])]; tensor q_25_pad_type_0 = const()[name = tensor("q_25_pad_type_0"), val = tensor("custom")]; tensor q_25_pad_0 = const()[name = tensor("q_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(573530944)))]; tensor q_25_cast_fp16 = conv(dilations = var_4471, groups = var_4371, pad = q_25_pad_0, pad_type = q_25_pad_type_0, strides = var_4469, weight = mid_block_attentions_0_transformer_blocks_0_attn1_to_q_weight_to_fp16, x = hidden_states_125_cast_fp16)[name = tensor("q_25_cast_fp16")]; tensor var_4475 = const()[name = tensor("op_4475"), val = tensor([1, 1])]; tensor var_4477 = const()[name = tensor("op_4477"), val = tensor([1, 1])]; tensor k_49_pad_type_0 = const()[name = tensor("k_49_pad_type_0"), val = tensor("custom")]; tensor k_49_pad_0 = const()[name = tensor("k_49_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(576807808)))]; tensor k_49_cast_fp16 = conv(dilations = var_4477, groups = var_4371, pad = k_49_pad_0, pad_type = k_49_pad_type_0, strides = var_4475, weight = mid_block_attentions_0_transformer_blocks_0_attn1_to_k_weight_to_fp16, x = hidden_states_125_cast_fp16)[name = tensor("k_49_cast_fp16")]; tensor var_4481 = const()[name = tensor("op_4481"), val = tensor([1, 1])]; tensor var_4483 = const()[name = tensor("op_4483"), val = tensor([1, 1])]; tensor v_25_pad_type_0 = const()[name = tensor("v_25_pad_type_0"), val = tensor("custom")]; tensor v_25_pad_0 = const()[name = tensor("v_25_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(580084672)))]; tensor v_25_cast_fp16 = conv(dilations = var_4483, groups = var_4371, pad = v_25_pad_0, pad_type = v_25_pad_type_0, strides = var_4481, weight = mid_block_attentions_0_transformer_blocks_0_attn1_to_v_weight_to_fp16, x = hidden_states_125_cast_fp16)[name = tensor("v_25_cast_fp16")]; tensor var_4487_begin_0 = const()[name = tensor("op_4487_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_4487_end_0 = const()[name = tensor("op_4487_end_0"), val = tensor([2, 64, 1, 36])]; tensor var_4487_end_mask_0 = const()[name = tensor("op_4487_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4487_cast_fp16 = slice_by_index(begin = var_4487_begin_0, end = var_4487_end_0, end_mask = var_4487_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4487_cast_fp16")]; tensor var_4491_begin_0 = const()[name = tensor("op_4491_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_4491_end_0 = const()[name = tensor("op_4491_end_0"), val = tensor([2, 128, 1, 36])]; tensor var_4491_end_mask_0 = const()[name = tensor("op_4491_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4491_cast_fp16 = slice_by_index(begin = var_4491_begin_0, end = var_4491_end_0, end_mask = var_4491_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4491_cast_fp16")]; tensor var_4495_begin_0 = const()[name = tensor("op_4495_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_4495_end_0 = const()[name = tensor("op_4495_end_0"), val = tensor([2, 192, 1, 36])]; tensor var_4495_end_mask_0 = const()[name = tensor("op_4495_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4495_cast_fp16 = slice_by_index(begin = var_4495_begin_0, end = var_4495_end_0, end_mask = var_4495_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4495_cast_fp16")]; tensor var_4499_begin_0 = const()[name = tensor("op_4499_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_4499_end_0 = const()[name = tensor("op_4499_end_0"), val = tensor([2, 256, 1, 36])]; tensor var_4499_end_mask_0 = const()[name = tensor("op_4499_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4499_cast_fp16 = slice_by_index(begin = var_4499_begin_0, end = var_4499_end_0, end_mask = var_4499_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4499_cast_fp16")]; tensor var_4503_begin_0 = const()[name = tensor("op_4503_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_4503_end_0 = const()[name = tensor("op_4503_end_0"), val = tensor([2, 320, 1, 36])]; tensor var_4503_end_mask_0 = const()[name = tensor("op_4503_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4503_cast_fp16 = slice_by_index(begin = var_4503_begin_0, end = var_4503_end_0, end_mask = var_4503_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4503_cast_fp16")]; tensor var_4507_begin_0 = const()[name = tensor("op_4507_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_4507_end_0 = const()[name = tensor("op_4507_end_0"), val = tensor([2, 384, 1, 36])]; tensor var_4507_end_mask_0 = const()[name = tensor("op_4507_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4507_cast_fp16 = slice_by_index(begin = var_4507_begin_0, end = var_4507_end_0, end_mask = var_4507_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4507_cast_fp16")]; tensor var_4511_begin_0 = const()[name = tensor("op_4511_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_4511_end_0 = const()[name = tensor("op_4511_end_0"), val = tensor([2, 448, 1, 36])]; tensor var_4511_end_mask_0 = const()[name = tensor("op_4511_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4511_cast_fp16 = slice_by_index(begin = var_4511_begin_0, end = var_4511_end_0, end_mask = var_4511_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4511_cast_fp16")]; tensor var_4515_begin_0 = const()[name = tensor("op_4515_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_4515_end_0 = const()[name = tensor("op_4515_end_0"), val = tensor([2, 512, 1, 36])]; tensor var_4515_end_mask_0 = const()[name = tensor("op_4515_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4515_cast_fp16 = slice_by_index(begin = var_4515_begin_0, end = var_4515_end_0, end_mask = var_4515_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4515_cast_fp16")]; tensor var_4519_begin_0 = const()[name = tensor("op_4519_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_4519_end_0 = const()[name = tensor("op_4519_end_0"), val = tensor([2, 576, 1, 36])]; tensor var_4519_end_mask_0 = const()[name = tensor("op_4519_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4519_cast_fp16 = slice_by_index(begin = var_4519_begin_0, end = var_4519_end_0, end_mask = var_4519_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4519_cast_fp16")]; tensor var_4523_begin_0 = const()[name = tensor("op_4523_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_4523_end_0 = const()[name = tensor("op_4523_end_0"), val = tensor([2, 640, 1, 36])]; tensor var_4523_end_mask_0 = const()[name = tensor("op_4523_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4523_cast_fp16 = slice_by_index(begin = var_4523_begin_0, end = var_4523_end_0, end_mask = var_4523_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4523_cast_fp16")]; tensor var_4527_begin_0 = const()[name = tensor("op_4527_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_4527_end_0 = const()[name = tensor("op_4527_end_0"), val = tensor([2, 704, 1, 36])]; tensor var_4527_end_mask_0 = const()[name = tensor("op_4527_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4527_cast_fp16 = slice_by_index(begin = var_4527_begin_0, end = var_4527_end_0, end_mask = var_4527_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4527_cast_fp16")]; tensor var_4531_begin_0 = const()[name = tensor("op_4531_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_4531_end_0 = const()[name = tensor("op_4531_end_0"), val = tensor([2, 768, 1, 36])]; tensor var_4531_end_mask_0 = const()[name = tensor("op_4531_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4531_cast_fp16 = slice_by_index(begin = var_4531_begin_0, end = var_4531_end_0, end_mask = var_4531_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4531_cast_fp16")]; tensor var_4535_begin_0 = const()[name = tensor("op_4535_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_4535_end_0 = const()[name = tensor("op_4535_end_0"), val = tensor([2, 832, 1, 36])]; tensor var_4535_end_mask_0 = const()[name = tensor("op_4535_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4535_cast_fp16 = slice_by_index(begin = var_4535_begin_0, end = var_4535_end_0, end_mask = var_4535_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4535_cast_fp16")]; tensor var_4539_begin_0 = const()[name = tensor("op_4539_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_4539_end_0 = const()[name = tensor("op_4539_end_0"), val = tensor([2, 896, 1, 36])]; tensor var_4539_end_mask_0 = const()[name = tensor("op_4539_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4539_cast_fp16 = slice_by_index(begin = var_4539_begin_0, end = var_4539_end_0, end_mask = var_4539_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4539_cast_fp16")]; tensor var_4543_begin_0 = const()[name = tensor("op_4543_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_4543_end_0 = const()[name = tensor("op_4543_end_0"), val = tensor([2, 960, 1, 36])]; tensor var_4543_end_mask_0 = const()[name = tensor("op_4543_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4543_cast_fp16 = slice_by_index(begin = var_4543_begin_0, end = var_4543_end_0, end_mask = var_4543_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4543_cast_fp16")]; tensor var_4547_begin_0 = const()[name = tensor("op_4547_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_4547_end_0 = const()[name = tensor("op_4547_end_0"), val = tensor([2, 1024, 1, 36])]; tensor var_4547_end_mask_0 = const()[name = tensor("op_4547_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4547_cast_fp16 = slice_by_index(begin = var_4547_begin_0, end = var_4547_end_0, end_mask = var_4547_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4547_cast_fp16")]; tensor var_4551_begin_0 = const()[name = tensor("op_4551_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_4551_end_0 = const()[name = tensor("op_4551_end_0"), val = tensor([2, 1088, 1, 36])]; tensor var_4551_end_mask_0 = const()[name = tensor("op_4551_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4551_cast_fp16 = slice_by_index(begin = var_4551_begin_0, end = var_4551_end_0, end_mask = var_4551_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4551_cast_fp16")]; tensor var_4555_begin_0 = const()[name = tensor("op_4555_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_4555_end_0 = const()[name = tensor("op_4555_end_0"), val = tensor([2, 1152, 1, 36])]; tensor var_4555_end_mask_0 = const()[name = tensor("op_4555_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4555_cast_fp16 = slice_by_index(begin = var_4555_begin_0, end = var_4555_end_0, end_mask = var_4555_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4555_cast_fp16")]; tensor var_4559_begin_0 = const()[name = tensor("op_4559_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_4559_end_0 = const()[name = tensor("op_4559_end_0"), val = tensor([2, 1216, 1, 36])]; tensor var_4559_end_mask_0 = const()[name = tensor("op_4559_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4559_cast_fp16 = slice_by_index(begin = var_4559_begin_0, end = var_4559_end_0, end_mask = var_4559_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4559_cast_fp16")]; tensor var_4563_begin_0 = const()[name = tensor("op_4563_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_4563_end_0 = const()[name = tensor("op_4563_end_0"), val = tensor([2, 1280, 1, 36])]; tensor var_4563_end_mask_0 = const()[name = tensor("op_4563_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4563_cast_fp16 = slice_by_index(begin = var_4563_begin_0, end = var_4563_end_0, end_mask = var_4563_end_mask_0, x = q_25_cast_fp16)[name = tensor("op_4563_cast_fp16")]; tensor k_51_perm_0 = const()[name = tensor("k_51_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_4570_begin_0 = const()[name = tensor("op_4570_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_4570_end_0 = const()[name = tensor("op_4570_end_0"), val = tensor([2, 36, 1, 64])]; tensor var_4570_end_mask_0 = const()[name = tensor("op_4570_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_1 = transpose(perm = k_51_perm_0, x = k_49_cast_fp16)[name = tensor("transpose_1")]; tensor var_4570_cast_fp16 = slice_by_index(begin = var_4570_begin_0, end = var_4570_end_0, end_mask = var_4570_end_mask_0, x = transpose_1)[name = tensor("op_4570_cast_fp16")]; tensor var_4574_begin_0 = const()[name = tensor("op_4574_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_4574_end_0 = const()[name = tensor("op_4574_end_0"), val = tensor([2, 36, 1, 128])]; tensor var_4574_end_mask_0 = const()[name = tensor("op_4574_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4574_cast_fp16 = slice_by_index(begin = var_4574_begin_0, end = var_4574_end_0, end_mask = var_4574_end_mask_0, x = transpose_1)[name = tensor("op_4574_cast_fp16")]; tensor var_4578_begin_0 = const()[name = tensor("op_4578_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_4578_end_0 = const()[name = tensor("op_4578_end_0"), val = tensor([2, 36, 1, 192])]; tensor var_4578_end_mask_0 = const()[name = tensor("op_4578_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4578_cast_fp16 = slice_by_index(begin = var_4578_begin_0, end = var_4578_end_0, end_mask = var_4578_end_mask_0, x = transpose_1)[name = tensor("op_4578_cast_fp16")]; tensor var_4582_begin_0 = const()[name = tensor("op_4582_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_4582_end_0 = const()[name = tensor("op_4582_end_0"), val = tensor([2, 36, 1, 256])]; tensor var_4582_end_mask_0 = const()[name = tensor("op_4582_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4582_cast_fp16 = slice_by_index(begin = var_4582_begin_0, end = var_4582_end_0, end_mask = var_4582_end_mask_0, x = transpose_1)[name = tensor("op_4582_cast_fp16")]; tensor var_4586_begin_0 = const()[name = tensor("op_4586_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_4586_end_0 = const()[name = tensor("op_4586_end_0"), val = tensor([2, 36, 1, 320])]; tensor var_4586_end_mask_0 = const()[name = tensor("op_4586_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4586_cast_fp16 = slice_by_index(begin = var_4586_begin_0, end = var_4586_end_0, end_mask = var_4586_end_mask_0, x = transpose_1)[name = tensor("op_4586_cast_fp16")]; tensor var_4590_begin_0 = const()[name = tensor("op_4590_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_4590_end_0 = const()[name = tensor("op_4590_end_0"), val = tensor([2, 36, 1, 384])]; tensor var_4590_end_mask_0 = const()[name = tensor("op_4590_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4590_cast_fp16 = slice_by_index(begin = var_4590_begin_0, end = var_4590_end_0, end_mask = var_4590_end_mask_0, x = transpose_1)[name = tensor("op_4590_cast_fp16")]; tensor var_4594_begin_0 = const()[name = tensor("op_4594_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_4594_end_0 = const()[name = tensor("op_4594_end_0"), val = tensor([2, 36, 1, 448])]; tensor var_4594_end_mask_0 = const()[name = tensor("op_4594_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4594_cast_fp16 = slice_by_index(begin = var_4594_begin_0, end = var_4594_end_0, end_mask = var_4594_end_mask_0, x = transpose_1)[name = tensor("op_4594_cast_fp16")]; tensor var_4598_begin_0 = const()[name = tensor("op_4598_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_4598_end_0 = const()[name = tensor("op_4598_end_0"), val = tensor([2, 36, 1, 512])]; tensor var_4598_end_mask_0 = const()[name = tensor("op_4598_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4598_cast_fp16 = slice_by_index(begin = var_4598_begin_0, end = var_4598_end_0, end_mask = var_4598_end_mask_0, x = transpose_1)[name = tensor("op_4598_cast_fp16")]; tensor var_4602_begin_0 = const()[name = tensor("op_4602_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_4602_end_0 = const()[name = tensor("op_4602_end_0"), val = tensor([2, 36, 1, 576])]; tensor var_4602_end_mask_0 = const()[name = tensor("op_4602_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4602_cast_fp16 = slice_by_index(begin = var_4602_begin_0, end = var_4602_end_0, end_mask = var_4602_end_mask_0, x = transpose_1)[name = tensor("op_4602_cast_fp16")]; tensor var_4606_begin_0 = const()[name = tensor("op_4606_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_4606_end_0 = const()[name = tensor("op_4606_end_0"), val = tensor([2, 36, 1, 640])]; tensor var_4606_end_mask_0 = const()[name = tensor("op_4606_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4606_cast_fp16 = slice_by_index(begin = var_4606_begin_0, end = var_4606_end_0, end_mask = var_4606_end_mask_0, x = transpose_1)[name = tensor("op_4606_cast_fp16")]; tensor var_4610_begin_0 = const()[name = tensor("op_4610_begin_0"), val = tensor([0, 0, 0, 640])]; tensor var_4610_end_0 = const()[name = tensor("op_4610_end_0"), val = tensor([2, 36, 1, 704])]; tensor var_4610_end_mask_0 = const()[name = tensor("op_4610_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4610_cast_fp16 = slice_by_index(begin = var_4610_begin_0, end = var_4610_end_0, end_mask = var_4610_end_mask_0, x = transpose_1)[name = tensor("op_4610_cast_fp16")]; tensor var_4614_begin_0 = const()[name = tensor("op_4614_begin_0"), val = tensor([0, 0, 0, 704])]; tensor var_4614_end_0 = const()[name = tensor("op_4614_end_0"), val = tensor([2, 36, 1, 768])]; tensor var_4614_end_mask_0 = const()[name = tensor("op_4614_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4614_cast_fp16 = slice_by_index(begin = var_4614_begin_0, end = var_4614_end_0, end_mask = var_4614_end_mask_0, x = transpose_1)[name = tensor("op_4614_cast_fp16")]; tensor var_4618_begin_0 = const()[name = tensor("op_4618_begin_0"), val = tensor([0, 0, 0, 768])]; tensor var_4618_end_0 = const()[name = tensor("op_4618_end_0"), val = tensor([2, 36, 1, 832])]; tensor var_4618_end_mask_0 = const()[name = tensor("op_4618_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4618_cast_fp16 = slice_by_index(begin = var_4618_begin_0, end = var_4618_end_0, end_mask = var_4618_end_mask_0, x = transpose_1)[name = tensor("op_4618_cast_fp16")]; tensor var_4622_begin_0 = const()[name = tensor("op_4622_begin_0"), val = tensor([0, 0, 0, 832])]; tensor var_4622_end_0 = const()[name = tensor("op_4622_end_0"), val = tensor([2, 36, 1, 896])]; tensor var_4622_end_mask_0 = const()[name = tensor("op_4622_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4622_cast_fp16 = slice_by_index(begin = var_4622_begin_0, end = var_4622_end_0, end_mask = var_4622_end_mask_0, x = transpose_1)[name = tensor("op_4622_cast_fp16")]; tensor var_4626_begin_0 = const()[name = tensor("op_4626_begin_0"), val = tensor([0, 0, 0, 896])]; tensor var_4626_end_0 = const()[name = tensor("op_4626_end_0"), val = tensor([2, 36, 1, 960])]; tensor var_4626_end_mask_0 = const()[name = tensor("op_4626_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4626_cast_fp16 = slice_by_index(begin = var_4626_begin_0, end = var_4626_end_0, end_mask = var_4626_end_mask_0, x = transpose_1)[name = tensor("op_4626_cast_fp16")]; tensor var_4630_begin_0 = const()[name = tensor("op_4630_begin_0"), val = tensor([0, 0, 0, 960])]; tensor var_4630_end_0 = const()[name = tensor("op_4630_end_0"), val = tensor([2, 36, 1, 1024])]; tensor var_4630_end_mask_0 = const()[name = tensor("op_4630_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4630_cast_fp16 = slice_by_index(begin = var_4630_begin_0, end = var_4630_end_0, end_mask = var_4630_end_mask_0, x = transpose_1)[name = tensor("op_4630_cast_fp16")]; tensor var_4634_begin_0 = const()[name = tensor("op_4634_begin_0"), val = tensor([0, 0, 0, 1024])]; tensor var_4634_end_0 = const()[name = tensor("op_4634_end_0"), val = tensor([2, 36, 1, 1088])]; tensor var_4634_end_mask_0 = const()[name = tensor("op_4634_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4634_cast_fp16 = slice_by_index(begin = var_4634_begin_0, end = var_4634_end_0, end_mask = var_4634_end_mask_0, x = transpose_1)[name = tensor("op_4634_cast_fp16")]; tensor var_4638_begin_0 = const()[name = tensor("op_4638_begin_0"), val = tensor([0, 0, 0, 1088])]; tensor var_4638_end_0 = const()[name = tensor("op_4638_end_0"), val = tensor([2, 36, 1, 1152])]; tensor var_4638_end_mask_0 = const()[name = tensor("op_4638_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4638_cast_fp16 = slice_by_index(begin = var_4638_begin_0, end = var_4638_end_0, end_mask = var_4638_end_mask_0, x = transpose_1)[name = tensor("op_4638_cast_fp16")]; tensor var_4642_begin_0 = const()[name = tensor("op_4642_begin_0"), val = tensor([0, 0, 0, 1152])]; tensor var_4642_end_0 = const()[name = tensor("op_4642_end_0"), val = tensor([2, 36, 1, 1216])]; tensor var_4642_end_mask_0 = const()[name = tensor("op_4642_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4642_cast_fp16 = slice_by_index(begin = var_4642_begin_0, end = var_4642_end_0, end_mask = var_4642_end_mask_0, x = transpose_1)[name = tensor("op_4642_cast_fp16")]; tensor var_4646_begin_0 = const()[name = tensor("op_4646_begin_0"), val = tensor([0, 0, 0, 1216])]; tensor var_4646_end_0 = const()[name = tensor("op_4646_end_0"), val = tensor([2, 36, 1, 1280])]; tensor var_4646_end_mask_0 = const()[name = tensor("op_4646_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_4646_cast_fp16 = slice_by_index(begin = var_4646_begin_0, end = var_4646_end_0, end_mask = var_4646_end_mask_0, x = transpose_1)[name = tensor("op_4646_cast_fp16")]; tensor var_4648_begin_0 = const()[name = tensor("op_4648_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_4648_end_0 = const()[name = tensor("op_4648_end_0"), val = tensor([2, 64, 1, 36])]; tensor var_4648_end_mask_0 = const()[name = tensor("op_4648_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4648_cast_fp16 = slice_by_index(begin = var_4648_begin_0, end = var_4648_end_0, end_mask = var_4648_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4648_cast_fp16")]; tensor var_4652_begin_0 = const()[name = tensor("op_4652_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_4652_end_0 = const()[name = tensor("op_4652_end_0"), val = tensor([2, 128, 1, 36])]; tensor var_4652_end_mask_0 = const()[name = tensor("op_4652_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4652_cast_fp16 = slice_by_index(begin = var_4652_begin_0, end = var_4652_end_0, end_mask = var_4652_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4652_cast_fp16")]; tensor var_4656_begin_0 = const()[name = tensor("op_4656_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_4656_end_0 = const()[name = tensor("op_4656_end_0"), val = tensor([2, 192, 1, 36])]; tensor var_4656_end_mask_0 = const()[name = tensor("op_4656_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4656_cast_fp16 = slice_by_index(begin = var_4656_begin_0, end = var_4656_end_0, end_mask = var_4656_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4656_cast_fp16")]; tensor var_4660_begin_0 = const()[name = tensor("op_4660_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_4660_end_0 = const()[name = tensor("op_4660_end_0"), val = tensor([2, 256, 1, 36])]; tensor var_4660_end_mask_0 = const()[name = tensor("op_4660_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4660_cast_fp16 = slice_by_index(begin = var_4660_begin_0, end = var_4660_end_0, end_mask = var_4660_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4660_cast_fp16")]; tensor var_4664_begin_0 = const()[name = tensor("op_4664_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_4664_end_0 = const()[name = tensor("op_4664_end_0"), val = tensor([2, 320, 1, 36])]; tensor var_4664_end_mask_0 = const()[name = tensor("op_4664_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4664_cast_fp16 = slice_by_index(begin = var_4664_begin_0, end = var_4664_end_0, end_mask = var_4664_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4664_cast_fp16")]; tensor var_4668_begin_0 = const()[name = tensor("op_4668_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_4668_end_0 = const()[name = tensor("op_4668_end_0"), val = tensor([2, 384, 1, 36])]; tensor var_4668_end_mask_0 = const()[name = tensor("op_4668_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4668_cast_fp16 = slice_by_index(begin = var_4668_begin_0, end = var_4668_end_0, end_mask = var_4668_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4668_cast_fp16")]; tensor var_4672_begin_0 = const()[name = tensor("op_4672_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_4672_end_0 = const()[name = tensor("op_4672_end_0"), val = tensor([2, 448, 1, 36])]; tensor var_4672_end_mask_0 = const()[name = tensor("op_4672_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4672_cast_fp16 = slice_by_index(begin = var_4672_begin_0, end = var_4672_end_0, end_mask = var_4672_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4672_cast_fp16")]; tensor var_4676_begin_0 = const()[name = tensor("op_4676_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_4676_end_0 = const()[name = tensor("op_4676_end_0"), val = tensor([2, 512, 1, 36])]; tensor var_4676_end_mask_0 = const()[name = tensor("op_4676_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4676_cast_fp16 = slice_by_index(begin = var_4676_begin_0, end = var_4676_end_0, end_mask = var_4676_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4676_cast_fp16")]; tensor var_4680_begin_0 = const()[name = tensor("op_4680_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_4680_end_0 = const()[name = tensor("op_4680_end_0"), val = tensor([2, 576, 1, 36])]; tensor var_4680_end_mask_0 = const()[name = tensor("op_4680_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4680_cast_fp16 = slice_by_index(begin = var_4680_begin_0, end = var_4680_end_0, end_mask = var_4680_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4680_cast_fp16")]; tensor var_4684_begin_0 = const()[name = tensor("op_4684_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_4684_end_0 = const()[name = tensor("op_4684_end_0"), val = tensor([2, 640, 1, 36])]; tensor var_4684_end_mask_0 = const()[name = tensor("op_4684_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4684_cast_fp16 = slice_by_index(begin = var_4684_begin_0, end = var_4684_end_0, end_mask = var_4684_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4684_cast_fp16")]; tensor var_4688_begin_0 = const()[name = tensor("op_4688_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_4688_end_0 = const()[name = tensor("op_4688_end_0"), val = tensor([2, 704, 1, 36])]; tensor var_4688_end_mask_0 = const()[name = tensor("op_4688_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4688_cast_fp16 = slice_by_index(begin = var_4688_begin_0, end = var_4688_end_0, end_mask = var_4688_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4688_cast_fp16")]; tensor var_4692_begin_0 = const()[name = tensor("op_4692_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_4692_end_0 = const()[name = tensor("op_4692_end_0"), val = tensor([2, 768, 1, 36])]; tensor var_4692_end_mask_0 = const()[name = tensor("op_4692_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4692_cast_fp16 = slice_by_index(begin = var_4692_begin_0, end = var_4692_end_0, end_mask = var_4692_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4692_cast_fp16")]; tensor var_4696_begin_0 = const()[name = tensor("op_4696_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_4696_end_0 = const()[name = tensor("op_4696_end_0"), val = tensor([2, 832, 1, 36])]; tensor var_4696_end_mask_0 = const()[name = tensor("op_4696_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4696_cast_fp16 = slice_by_index(begin = var_4696_begin_0, end = var_4696_end_0, end_mask = var_4696_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4696_cast_fp16")]; tensor var_4700_begin_0 = const()[name = tensor("op_4700_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_4700_end_0 = const()[name = tensor("op_4700_end_0"), val = tensor([2, 896, 1, 36])]; tensor var_4700_end_mask_0 = const()[name = tensor("op_4700_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4700_cast_fp16 = slice_by_index(begin = var_4700_begin_0, end = var_4700_end_0, end_mask = var_4700_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4700_cast_fp16")]; tensor var_4704_begin_0 = const()[name = tensor("op_4704_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_4704_end_0 = const()[name = tensor("op_4704_end_0"), val = tensor([2, 960, 1, 36])]; tensor var_4704_end_mask_0 = const()[name = tensor("op_4704_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4704_cast_fp16 = slice_by_index(begin = var_4704_begin_0, end = var_4704_end_0, end_mask = var_4704_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4704_cast_fp16")]; tensor var_4708_begin_0 = const()[name = tensor("op_4708_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_4708_end_0 = const()[name = tensor("op_4708_end_0"), val = tensor([2, 1024, 1, 36])]; tensor var_4708_end_mask_0 = const()[name = tensor("op_4708_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4708_cast_fp16 = slice_by_index(begin = var_4708_begin_0, end = var_4708_end_0, end_mask = var_4708_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4708_cast_fp16")]; tensor var_4712_begin_0 = const()[name = tensor("op_4712_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_4712_end_0 = const()[name = tensor("op_4712_end_0"), val = tensor([2, 1088, 1, 36])]; tensor var_4712_end_mask_0 = const()[name = tensor("op_4712_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4712_cast_fp16 = slice_by_index(begin = var_4712_begin_0, end = var_4712_end_0, end_mask = var_4712_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4712_cast_fp16")]; tensor var_4716_begin_0 = const()[name = tensor("op_4716_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_4716_end_0 = const()[name = tensor("op_4716_end_0"), val = tensor([2, 1152, 1, 36])]; tensor var_4716_end_mask_0 = const()[name = tensor("op_4716_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4716_cast_fp16 = slice_by_index(begin = var_4716_begin_0, end = var_4716_end_0, end_mask = var_4716_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4716_cast_fp16")]; tensor var_4720_begin_0 = const()[name = tensor("op_4720_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_4720_end_0 = const()[name = tensor("op_4720_end_0"), val = tensor([2, 1216, 1, 36])]; tensor var_4720_end_mask_0 = const()[name = tensor("op_4720_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4720_cast_fp16 = slice_by_index(begin = var_4720_begin_0, end = var_4720_end_0, end_mask = var_4720_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4720_cast_fp16")]; tensor var_4724_begin_0 = const()[name = tensor("op_4724_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_4724_end_0 = const()[name = tensor("op_4724_end_0"), val = tensor([2, 1280, 1, 36])]; tensor var_4724_end_mask_0 = const()[name = tensor("op_4724_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4724_cast_fp16 = slice_by_index(begin = var_4724_begin_0, end = var_4724_end_0, end_mask = var_4724_end_mask_0, x = v_25_cast_fp16)[name = tensor("op_4724_cast_fp16")]; tensor var_4728_equation_0 = const()[name = tensor("op_4728_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4728_cast_fp16 = einsum(equation = var_4728_equation_0, values = (var_4570_cast_fp16, var_4487_cast_fp16))[name = tensor("op_4728_cast_fp16")]; tensor var_4729_to_fp16 = const()[name = tensor("op_4729_to_fp16"), val = tensor(0x1p-3)]; tensor aw_281_cast_fp16 = mul(x = var_4728_cast_fp16, y = var_4729_to_fp16)[name = tensor("aw_281_cast_fp16")]; tensor var_4732_equation_0 = const()[name = tensor("op_4732_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4732_cast_fp16 = einsum(equation = var_4732_equation_0, values = (var_4574_cast_fp16, var_4491_cast_fp16))[name = tensor("op_4732_cast_fp16")]; tensor var_4733_to_fp16 = const()[name = tensor("op_4733_to_fp16"), val = tensor(0x1p-3)]; tensor aw_283_cast_fp16 = mul(x = var_4732_cast_fp16, y = var_4733_to_fp16)[name = tensor("aw_283_cast_fp16")]; tensor var_4736_equation_0 = const()[name = tensor("op_4736_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4736_cast_fp16 = einsum(equation = var_4736_equation_0, values = (var_4578_cast_fp16, var_4495_cast_fp16))[name = tensor("op_4736_cast_fp16")]; tensor var_4737_to_fp16 = const()[name = tensor("op_4737_to_fp16"), val = tensor(0x1p-3)]; tensor aw_285_cast_fp16 = mul(x = var_4736_cast_fp16, y = var_4737_to_fp16)[name = tensor("aw_285_cast_fp16")]; tensor var_4740_equation_0 = const()[name = tensor("op_4740_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4740_cast_fp16 = einsum(equation = var_4740_equation_0, values = (var_4582_cast_fp16, var_4499_cast_fp16))[name = tensor("op_4740_cast_fp16")]; tensor var_4741_to_fp16 = const()[name = tensor("op_4741_to_fp16"), val = tensor(0x1p-3)]; tensor aw_287_cast_fp16 = mul(x = var_4740_cast_fp16, y = var_4741_to_fp16)[name = tensor("aw_287_cast_fp16")]; tensor var_4744_equation_0 = const()[name = tensor("op_4744_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4744_cast_fp16 = einsum(equation = var_4744_equation_0, values = (var_4586_cast_fp16, var_4503_cast_fp16))[name = tensor("op_4744_cast_fp16")]; tensor var_4745_to_fp16 = const()[name = tensor("op_4745_to_fp16"), val = tensor(0x1p-3)]; tensor aw_289_cast_fp16 = mul(x = var_4744_cast_fp16, y = var_4745_to_fp16)[name = tensor("aw_289_cast_fp16")]; tensor var_4748_equation_0 = const()[name = tensor("op_4748_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4748_cast_fp16 = einsum(equation = var_4748_equation_0, values = (var_4590_cast_fp16, var_4507_cast_fp16))[name = tensor("op_4748_cast_fp16")]; tensor var_4749_to_fp16 = const()[name = tensor("op_4749_to_fp16"), val = tensor(0x1p-3)]; tensor aw_291_cast_fp16 = mul(x = var_4748_cast_fp16, y = var_4749_to_fp16)[name = tensor("aw_291_cast_fp16")]; tensor var_4752_equation_0 = const()[name = tensor("op_4752_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4752_cast_fp16 = einsum(equation = var_4752_equation_0, values = (var_4594_cast_fp16, var_4511_cast_fp16))[name = tensor("op_4752_cast_fp16")]; tensor var_4753_to_fp16 = const()[name = tensor("op_4753_to_fp16"), val = tensor(0x1p-3)]; tensor aw_293_cast_fp16 = mul(x = var_4752_cast_fp16, y = var_4753_to_fp16)[name = tensor("aw_293_cast_fp16")]; tensor var_4756_equation_0 = const()[name = tensor("op_4756_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4756_cast_fp16 = einsum(equation = var_4756_equation_0, values = (var_4598_cast_fp16, var_4515_cast_fp16))[name = tensor("op_4756_cast_fp16")]; tensor var_4757_to_fp16 = const()[name = tensor("op_4757_to_fp16"), val = tensor(0x1p-3)]; tensor aw_295_cast_fp16 = mul(x = var_4756_cast_fp16, y = var_4757_to_fp16)[name = tensor("aw_295_cast_fp16")]; tensor var_4760_equation_0 = const()[name = tensor("op_4760_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4760_cast_fp16 = einsum(equation = var_4760_equation_0, values = (var_4602_cast_fp16, var_4519_cast_fp16))[name = tensor("op_4760_cast_fp16")]; tensor var_4761_to_fp16 = const()[name = tensor("op_4761_to_fp16"), val = tensor(0x1p-3)]; tensor aw_297_cast_fp16 = mul(x = var_4760_cast_fp16, y = var_4761_to_fp16)[name = tensor("aw_297_cast_fp16")]; tensor var_4764_equation_0 = const()[name = tensor("op_4764_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4764_cast_fp16 = einsum(equation = var_4764_equation_0, values = (var_4606_cast_fp16, var_4523_cast_fp16))[name = tensor("op_4764_cast_fp16")]; tensor var_4765_to_fp16 = const()[name = tensor("op_4765_to_fp16"), val = tensor(0x1p-3)]; tensor aw_299_cast_fp16 = mul(x = var_4764_cast_fp16, y = var_4765_to_fp16)[name = tensor("aw_299_cast_fp16")]; tensor var_4768_equation_0 = const()[name = tensor("op_4768_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4768_cast_fp16 = einsum(equation = var_4768_equation_0, values = (var_4610_cast_fp16, var_4527_cast_fp16))[name = tensor("op_4768_cast_fp16")]; tensor var_4769_to_fp16 = const()[name = tensor("op_4769_to_fp16"), val = tensor(0x1p-3)]; tensor aw_301_cast_fp16 = mul(x = var_4768_cast_fp16, y = var_4769_to_fp16)[name = tensor("aw_301_cast_fp16")]; tensor var_4772_equation_0 = const()[name = tensor("op_4772_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4772_cast_fp16 = einsum(equation = var_4772_equation_0, values = (var_4614_cast_fp16, var_4531_cast_fp16))[name = tensor("op_4772_cast_fp16")]; tensor var_4773_to_fp16 = const()[name = tensor("op_4773_to_fp16"), val = tensor(0x1p-3)]; tensor aw_303_cast_fp16 = mul(x = var_4772_cast_fp16, y = var_4773_to_fp16)[name = tensor("aw_303_cast_fp16")]; tensor var_4776_equation_0 = const()[name = tensor("op_4776_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4776_cast_fp16 = einsum(equation = var_4776_equation_0, values = (var_4618_cast_fp16, var_4535_cast_fp16))[name = tensor("op_4776_cast_fp16")]; tensor var_4777_to_fp16 = const()[name = tensor("op_4777_to_fp16"), val = tensor(0x1p-3)]; tensor aw_305_cast_fp16 = mul(x = var_4776_cast_fp16, y = var_4777_to_fp16)[name = tensor("aw_305_cast_fp16")]; tensor var_4780_equation_0 = const()[name = tensor("op_4780_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4780_cast_fp16 = einsum(equation = var_4780_equation_0, values = (var_4622_cast_fp16, var_4539_cast_fp16))[name = tensor("op_4780_cast_fp16")]; tensor var_4781_to_fp16 = const()[name = tensor("op_4781_to_fp16"), val = tensor(0x1p-3)]; tensor aw_307_cast_fp16 = mul(x = var_4780_cast_fp16, y = var_4781_to_fp16)[name = tensor("aw_307_cast_fp16")]; tensor var_4784_equation_0 = const()[name = tensor("op_4784_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4784_cast_fp16 = einsum(equation = var_4784_equation_0, values = (var_4626_cast_fp16, var_4543_cast_fp16))[name = tensor("op_4784_cast_fp16")]; tensor var_4785_to_fp16 = const()[name = tensor("op_4785_to_fp16"), val = tensor(0x1p-3)]; tensor aw_309_cast_fp16 = mul(x = var_4784_cast_fp16, y = var_4785_to_fp16)[name = tensor("aw_309_cast_fp16")]; tensor var_4788_equation_0 = const()[name = tensor("op_4788_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4788_cast_fp16 = einsum(equation = var_4788_equation_0, values = (var_4630_cast_fp16, var_4547_cast_fp16))[name = tensor("op_4788_cast_fp16")]; tensor var_4789_to_fp16 = const()[name = tensor("op_4789_to_fp16"), val = tensor(0x1p-3)]; tensor aw_311_cast_fp16 = mul(x = var_4788_cast_fp16, y = var_4789_to_fp16)[name = tensor("aw_311_cast_fp16")]; tensor var_4792_equation_0 = const()[name = tensor("op_4792_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4792_cast_fp16 = einsum(equation = var_4792_equation_0, values = (var_4634_cast_fp16, var_4551_cast_fp16))[name = tensor("op_4792_cast_fp16")]; tensor var_4793_to_fp16 = const()[name = tensor("op_4793_to_fp16"), val = tensor(0x1p-3)]; tensor aw_313_cast_fp16 = mul(x = var_4792_cast_fp16, y = var_4793_to_fp16)[name = tensor("aw_313_cast_fp16")]; tensor var_4796_equation_0 = const()[name = tensor("op_4796_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4796_cast_fp16 = einsum(equation = var_4796_equation_0, values = (var_4638_cast_fp16, var_4555_cast_fp16))[name = tensor("op_4796_cast_fp16")]; tensor var_4797_to_fp16 = const()[name = tensor("op_4797_to_fp16"), val = tensor(0x1p-3)]; tensor aw_315_cast_fp16 = mul(x = var_4796_cast_fp16, y = var_4797_to_fp16)[name = tensor("aw_315_cast_fp16")]; tensor var_4800_equation_0 = const()[name = tensor("op_4800_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4800_cast_fp16 = einsum(equation = var_4800_equation_0, values = (var_4642_cast_fp16, var_4559_cast_fp16))[name = tensor("op_4800_cast_fp16")]; tensor var_4801_to_fp16 = const()[name = tensor("op_4801_to_fp16"), val = tensor(0x1p-3)]; tensor aw_317_cast_fp16 = mul(x = var_4800_cast_fp16, y = var_4801_to_fp16)[name = tensor("aw_317_cast_fp16")]; tensor var_4804_equation_0 = const()[name = tensor("op_4804_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_4804_cast_fp16 = einsum(equation = var_4804_equation_0, values = (var_4646_cast_fp16, var_4563_cast_fp16))[name = tensor("op_4804_cast_fp16")]; tensor var_4805_to_fp16 = const()[name = tensor("op_4805_to_fp16"), val = tensor(0x1p-3)]; tensor aw_319_cast_fp16 = mul(x = var_4804_cast_fp16, y = var_4805_to_fp16)[name = tensor("aw_319_cast_fp16")]; tensor var_4807_cast_fp16 = softmax(axis = var_4371, x = aw_281_cast_fp16)[name = tensor("op_4807_cast_fp16")]; tensor var_4808_cast_fp16 = softmax(axis = var_4371, x = aw_283_cast_fp16)[name = tensor("op_4808_cast_fp16")]; tensor var_4809_cast_fp16 = softmax(axis = var_4371, x = aw_285_cast_fp16)[name = tensor("op_4809_cast_fp16")]; tensor var_4810_cast_fp16 = softmax(axis = var_4371, x = aw_287_cast_fp16)[name = tensor("op_4810_cast_fp16")]; tensor var_4811_cast_fp16 = softmax(axis = var_4371, x = aw_289_cast_fp16)[name = tensor("op_4811_cast_fp16")]; tensor var_4812_cast_fp16 = softmax(axis = var_4371, x = aw_291_cast_fp16)[name = tensor("op_4812_cast_fp16")]; tensor var_4813_cast_fp16 = softmax(axis = var_4371, x = aw_293_cast_fp16)[name = tensor("op_4813_cast_fp16")]; tensor var_4814_cast_fp16 = softmax(axis = var_4371, x = aw_295_cast_fp16)[name = tensor("op_4814_cast_fp16")]; tensor var_4815_cast_fp16 = softmax(axis = var_4371, x = aw_297_cast_fp16)[name = tensor("op_4815_cast_fp16")]; tensor var_4816_cast_fp16 = softmax(axis = var_4371, x = aw_299_cast_fp16)[name = tensor("op_4816_cast_fp16")]; tensor var_4817_cast_fp16 = softmax(axis = var_4371, x = aw_301_cast_fp16)[name = tensor("op_4817_cast_fp16")]; tensor var_4818_cast_fp16 = softmax(axis = var_4371, x = aw_303_cast_fp16)[name = tensor("op_4818_cast_fp16")]; tensor var_4819_cast_fp16 = softmax(axis = var_4371, x = aw_305_cast_fp16)[name = tensor("op_4819_cast_fp16")]; tensor var_4820_cast_fp16 = softmax(axis = var_4371, x = aw_307_cast_fp16)[name = tensor("op_4820_cast_fp16")]; tensor var_4821_cast_fp16 = softmax(axis = var_4371, x = aw_309_cast_fp16)[name = tensor("op_4821_cast_fp16")]; tensor var_4822_cast_fp16 = softmax(axis = var_4371, x = aw_311_cast_fp16)[name = tensor("op_4822_cast_fp16")]; tensor var_4823_cast_fp16 = softmax(axis = var_4371, x = aw_313_cast_fp16)[name = tensor("op_4823_cast_fp16")]; tensor var_4824_cast_fp16 = softmax(axis = var_4371, x = aw_315_cast_fp16)[name = tensor("op_4824_cast_fp16")]; tensor var_4825_cast_fp16 = softmax(axis = var_4371, x = aw_317_cast_fp16)[name = tensor("op_4825_cast_fp16")]; tensor var_4826_cast_fp16 = softmax(axis = var_4371, x = aw_319_cast_fp16)[name = tensor("op_4826_cast_fp16")]; tensor var_4828_equation_0 = const()[name = tensor("op_4828_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4828_cast_fp16 = einsum(equation = var_4828_equation_0, values = (var_4648_cast_fp16, var_4807_cast_fp16))[name = tensor("op_4828_cast_fp16")]; tensor var_4830_equation_0 = const()[name = tensor("op_4830_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4830_cast_fp16 = einsum(equation = var_4830_equation_0, values = (var_4652_cast_fp16, var_4808_cast_fp16))[name = tensor("op_4830_cast_fp16")]; tensor var_4832_equation_0 = const()[name = tensor("op_4832_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4832_cast_fp16 = einsum(equation = var_4832_equation_0, values = (var_4656_cast_fp16, var_4809_cast_fp16))[name = tensor("op_4832_cast_fp16")]; tensor var_4834_equation_0 = const()[name = tensor("op_4834_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4834_cast_fp16 = einsum(equation = var_4834_equation_0, values = (var_4660_cast_fp16, var_4810_cast_fp16))[name = tensor("op_4834_cast_fp16")]; tensor var_4836_equation_0 = const()[name = tensor("op_4836_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4836_cast_fp16 = einsum(equation = var_4836_equation_0, values = (var_4664_cast_fp16, var_4811_cast_fp16))[name = tensor("op_4836_cast_fp16")]; tensor var_4838_equation_0 = const()[name = tensor("op_4838_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4838_cast_fp16 = einsum(equation = var_4838_equation_0, values = (var_4668_cast_fp16, var_4812_cast_fp16))[name = tensor("op_4838_cast_fp16")]; tensor var_4840_equation_0 = const()[name = tensor("op_4840_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4840_cast_fp16 = einsum(equation = var_4840_equation_0, values = (var_4672_cast_fp16, var_4813_cast_fp16))[name = tensor("op_4840_cast_fp16")]; tensor var_4842_equation_0 = const()[name = tensor("op_4842_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4842_cast_fp16 = einsum(equation = var_4842_equation_0, values = (var_4676_cast_fp16, var_4814_cast_fp16))[name = tensor("op_4842_cast_fp16")]; tensor var_4844_equation_0 = const()[name = tensor("op_4844_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4844_cast_fp16 = einsum(equation = var_4844_equation_0, values = (var_4680_cast_fp16, var_4815_cast_fp16))[name = tensor("op_4844_cast_fp16")]; tensor var_4846_equation_0 = const()[name = tensor("op_4846_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4846_cast_fp16 = einsum(equation = var_4846_equation_0, values = (var_4684_cast_fp16, var_4816_cast_fp16))[name = tensor("op_4846_cast_fp16")]; tensor var_4848_equation_0 = const()[name = tensor("op_4848_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4848_cast_fp16 = einsum(equation = var_4848_equation_0, values = (var_4688_cast_fp16, var_4817_cast_fp16))[name = tensor("op_4848_cast_fp16")]; tensor var_4850_equation_0 = const()[name = tensor("op_4850_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4850_cast_fp16 = einsum(equation = var_4850_equation_0, values = (var_4692_cast_fp16, var_4818_cast_fp16))[name = tensor("op_4850_cast_fp16")]; tensor var_4852_equation_0 = const()[name = tensor("op_4852_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4852_cast_fp16 = einsum(equation = var_4852_equation_0, values = (var_4696_cast_fp16, var_4819_cast_fp16))[name = tensor("op_4852_cast_fp16")]; tensor var_4854_equation_0 = const()[name = tensor("op_4854_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4854_cast_fp16 = einsum(equation = var_4854_equation_0, values = (var_4700_cast_fp16, var_4820_cast_fp16))[name = tensor("op_4854_cast_fp16")]; tensor var_4856_equation_0 = const()[name = tensor("op_4856_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4856_cast_fp16 = einsum(equation = var_4856_equation_0, values = (var_4704_cast_fp16, var_4821_cast_fp16))[name = tensor("op_4856_cast_fp16")]; tensor var_4858_equation_0 = const()[name = tensor("op_4858_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4858_cast_fp16 = einsum(equation = var_4858_equation_0, values = (var_4708_cast_fp16, var_4822_cast_fp16))[name = tensor("op_4858_cast_fp16")]; tensor var_4860_equation_0 = const()[name = tensor("op_4860_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4860_cast_fp16 = einsum(equation = var_4860_equation_0, values = (var_4712_cast_fp16, var_4823_cast_fp16))[name = tensor("op_4860_cast_fp16")]; tensor var_4862_equation_0 = const()[name = tensor("op_4862_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4862_cast_fp16 = einsum(equation = var_4862_equation_0, values = (var_4716_cast_fp16, var_4824_cast_fp16))[name = tensor("op_4862_cast_fp16")]; tensor var_4864_equation_0 = const()[name = tensor("op_4864_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4864_cast_fp16 = einsum(equation = var_4864_equation_0, values = (var_4720_cast_fp16, var_4825_cast_fp16))[name = tensor("op_4864_cast_fp16")]; tensor var_4866_equation_0 = const()[name = tensor("op_4866_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_4866_cast_fp16 = einsum(equation = var_4866_equation_0, values = (var_4724_cast_fp16, var_4826_cast_fp16))[name = tensor("op_4866_cast_fp16")]; tensor input_215_interleave_0 = const()[name = tensor("input_215_interleave_0"), val = tensor(false)]; tensor input_215_cast_fp16 = concat(axis = var_4371, interleave = input_215_interleave_0, values = (var_4828_cast_fp16, var_4830_cast_fp16, var_4832_cast_fp16, var_4834_cast_fp16, var_4836_cast_fp16, var_4838_cast_fp16, var_4840_cast_fp16, var_4842_cast_fp16, var_4844_cast_fp16, var_4846_cast_fp16, var_4848_cast_fp16, var_4850_cast_fp16, var_4852_cast_fp16, var_4854_cast_fp16, var_4856_cast_fp16, var_4858_cast_fp16, var_4860_cast_fp16, var_4862_cast_fp16, var_4864_cast_fp16, var_4866_cast_fp16))[name = tensor("input_215_cast_fp16")]; tensor var_4872 = const()[name = tensor("op_4872"), val = tensor([1, 1])]; tensor var_4874 = const()[name = tensor("op_4874"), val = tensor([1, 1])]; tensor var_4876_pad_type_0 = const()[name = tensor("op_4876_pad_type_0"), val = tensor("custom")]; tensor var_4876_pad_0 = const()[name = tensor("op_4876_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(583361536)))]; tensor mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586638400)))]; tensor var_4876_cast_fp16 = conv(bias = mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_bias_to_fp16, dilations = var_4874, groups = var_4371, pad = var_4876_pad_0, pad_type = var_4876_pad_type_0, strides = var_4872, weight = mid_block_attentions_0_transformer_blocks_0_attn1_to_out_0_weight_to_fp16, x = input_215_cast_fp16)[name = tensor("op_4876_cast_fp16")]; tensor inputs_39_cast_fp16 = add(x = var_4876_cast_fp16, y = inputs_37_cast_fp16)[name = tensor("inputs_39_cast_fp16")]; tensor var_4880 = const()[name = tensor("op_4880"), val = tensor([1])]; tensor channels_mean_39_cast_fp16 = reduce_mean(axes = var_4880, keep_dims = var_4366, x = inputs_39_cast_fp16)[name = tensor("channels_mean_39_cast_fp16")]; tensor zero_mean_39_cast_fp16 = sub(x = inputs_39_cast_fp16, y = channels_mean_39_cast_fp16)[name = tensor("zero_mean_39_cast_fp16")]; tensor zero_mean_sq_39_cast_fp16 = mul(x = zero_mean_39_cast_fp16, y = zero_mean_39_cast_fp16)[name = tensor("zero_mean_sq_39_cast_fp16")]; tensor var_4884 = const()[name = tensor("op_4884"), val = tensor([1])]; tensor var_4885_cast_fp16 = reduce_mean(axes = var_4884, keep_dims = var_4366, x = zero_mean_sq_39_cast_fp16)[name = tensor("op_4885_cast_fp16")]; tensor var_4886_to_fp16 = const()[name = tensor("op_4886_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_4887_cast_fp16 = add(x = var_4885_cast_fp16, y = var_4886_to_fp16)[name = tensor("op_4887_cast_fp16")]; tensor denom_39_epsilon_0_to_fp16 = const()[name = tensor("denom_39_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_39_cast_fp16 = rsqrt(epsilon = denom_39_epsilon_0_to_fp16, x = var_4887_cast_fp16)[name = tensor("denom_39_cast_fp16")]; tensor out_39_cast_fp16 = mul(x = zero_mean_39_cast_fp16, y = denom_39_cast_fp16)[name = tensor("out_39_cast_fp16")]; tensor var_4891_to_fp16 = const()[name = tensor("op_4891_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586641024)))]; tensor var_4892_cast_fp16 = add(x = out_39_cast_fp16, y = var_4891_to_fp16)[name = tensor("op_4892_cast_fp16")]; tensor var_4894_to_fp16 = const()[name = tensor("op_4894_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586643648)))]; tensor hidden_states_127_cast_fp16 = mul(x = var_4892_cast_fp16, y = var_4894_to_fp16)[name = tensor("hidden_states_127_cast_fp16")]; tensor var_4901 = const()[name = tensor("op_4901"), val = tensor([1, 1])]; tensor var_4903 = const()[name = tensor("op_4903"), val = tensor([1, 1])]; tensor q_27_pad_type_0 = const()[name = tensor("q_27_pad_type_0"), val = tensor("custom")]; tensor q_27_pad_0 = const()[name = tensor("q_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(586646272)))]; tensor q_27_cast_fp16 = conv(dilations = var_4903, groups = var_4371, pad = q_27_pad_0, pad_type = q_27_pad_type_0, strides = var_4901, weight = mid_block_attentions_0_transformer_blocks_0_attn2_to_q_weight_to_fp16, x = hidden_states_127_cast_fp16)[name = tensor("q_27_cast_fp16")]; tensor var_4907 = const()[name = tensor("op_4907"), val = tensor([1, 1])]; tensor var_4909 = const()[name = tensor("op_4909"), val = tensor([1, 1])]; tensor k_53_pad_type_0 = const()[name = tensor("k_53_pad_type_0"), val = tensor("custom")]; tensor k_53_pad_0 = const()[name = tensor("k_53_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589923136)))]; tensor k_53_cast_fp16 = conv(dilations = var_4909, groups = var_4371, pad = k_53_pad_0, pad_type = k_53_pad_type_0, strides = var_4907, weight = mid_block_attentions_0_transformer_blocks_0_attn2_to_k_weight_to_fp16, x = encoder_hidden_states)[name = tensor("k_53_cast_fp16")]; tensor var_4913 = const()[name = tensor("op_4913"), val = tensor([1, 1])]; tensor var_4915 = const()[name = tensor("op_4915"), val = tensor([1, 1])]; tensor v_27_pad_type_0 = const()[name = tensor("v_27_pad_type_0"), val = tensor("custom")]; tensor v_27_pad_0 = const()[name = tensor("v_27_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(592544640)))]; tensor v_27_cast_fp16 = conv(dilations = var_4915, groups = var_4371, pad = v_27_pad_0, pad_type = v_27_pad_type_0, strides = var_4913, weight = mid_block_attentions_0_transformer_blocks_0_attn2_to_v_weight_to_fp16, x = encoder_hidden_states)[name = tensor("v_27_cast_fp16")]; tensor var_4919_begin_0 = const()[name = tensor("op_4919_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_4919_end_0 = const()[name = tensor("op_4919_end_0"), val = tensor([2, 64, 1, 36])]; tensor var_4919_end_mask_0 = const()[name = tensor("op_4919_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4919_cast_fp16 = slice_by_index(begin = var_4919_begin_0, end = var_4919_end_0, end_mask = var_4919_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4919_cast_fp16")]; tensor var_4923_begin_0 = const()[name = tensor("op_4923_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_4923_end_0 = const()[name = tensor("op_4923_end_0"), val = tensor([2, 128, 1, 36])]; tensor var_4923_end_mask_0 = const()[name = tensor("op_4923_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4923_cast_fp16 = slice_by_index(begin = var_4923_begin_0, end = var_4923_end_0, end_mask = var_4923_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4923_cast_fp16")]; tensor var_4927_begin_0 = const()[name = tensor("op_4927_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_4927_end_0 = const()[name = tensor("op_4927_end_0"), val = tensor([2, 192, 1, 36])]; tensor var_4927_end_mask_0 = const()[name = tensor("op_4927_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4927_cast_fp16 = slice_by_index(begin = var_4927_begin_0, end = var_4927_end_0, end_mask = var_4927_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4927_cast_fp16")]; tensor var_4931_begin_0 = const()[name = tensor("op_4931_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_4931_end_0 = const()[name = tensor("op_4931_end_0"), val = tensor([2, 256, 1, 36])]; tensor var_4931_end_mask_0 = const()[name = tensor("op_4931_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4931_cast_fp16 = slice_by_index(begin = var_4931_begin_0, end = var_4931_end_0, end_mask = var_4931_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4931_cast_fp16")]; tensor var_4935_begin_0 = const()[name = tensor("op_4935_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_4935_end_0 = const()[name = tensor("op_4935_end_0"), val = tensor([2, 320, 1, 36])]; tensor var_4935_end_mask_0 = const()[name = tensor("op_4935_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4935_cast_fp16 = slice_by_index(begin = var_4935_begin_0, end = var_4935_end_0, end_mask = var_4935_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4935_cast_fp16")]; tensor var_4939_begin_0 = const()[name = tensor("op_4939_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_4939_end_0 = const()[name = tensor("op_4939_end_0"), val = tensor([2, 384, 1, 36])]; tensor var_4939_end_mask_0 = const()[name = tensor("op_4939_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4939_cast_fp16 = slice_by_index(begin = var_4939_begin_0, end = var_4939_end_0, end_mask = var_4939_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4939_cast_fp16")]; tensor var_4943_begin_0 = const()[name = tensor("op_4943_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_4943_end_0 = const()[name = tensor("op_4943_end_0"), val = tensor([2, 448, 1, 36])]; tensor var_4943_end_mask_0 = const()[name = tensor("op_4943_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4943_cast_fp16 = slice_by_index(begin = var_4943_begin_0, end = var_4943_end_0, end_mask = var_4943_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4943_cast_fp16")]; tensor var_4947_begin_0 = const()[name = tensor("op_4947_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_4947_end_0 = const()[name = tensor("op_4947_end_0"), val = tensor([2, 512, 1, 36])]; tensor var_4947_end_mask_0 = const()[name = tensor("op_4947_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4947_cast_fp16 = slice_by_index(begin = var_4947_begin_0, end = var_4947_end_0, end_mask = var_4947_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4947_cast_fp16")]; tensor var_4951_begin_0 = const()[name = tensor("op_4951_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_4951_end_0 = const()[name = tensor("op_4951_end_0"), val = tensor([2, 576, 1, 36])]; tensor var_4951_end_mask_0 = const()[name = tensor("op_4951_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4951_cast_fp16 = slice_by_index(begin = var_4951_begin_0, end = var_4951_end_0, end_mask = var_4951_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4951_cast_fp16")]; tensor var_4955_begin_0 = const()[name = tensor("op_4955_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_4955_end_0 = const()[name = tensor("op_4955_end_0"), val = tensor([2, 640, 1, 36])]; tensor var_4955_end_mask_0 = const()[name = tensor("op_4955_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4955_cast_fp16 = slice_by_index(begin = var_4955_begin_0, end = var_4955_end_0, end_mask = var_4955_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4955_cast_fp16")]; tensor var_4959_begin_0 = const()[name = tensor("op_4959_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_4959_end_0 = const()[name = tensor("op_4959_end_0"), val = tensor([2, 704, 1, 36])]; tensor var_4959_end_mask_0 = const()[name = tensor("op_4959_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4959_cast_fp16 = slice_by_index(begin = var_4959_begin_0, end = var_4959_end_0, end_mask = var_4959_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4959_cast_fp16")]; tensor var_4963_begin_0 = const()[name = tensor("op_4963_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_4963_end_0 = const()[name = tensor("op_4963_end_0"), val = tensor([2, 768, 1, 36])]; tensor var_4963_end_mask_0 = const()[name = tensor("op_4963_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4963_cast_fp16 = slice_by_index(begin = var_4963_begin_0, end = var_4963_end_0, end_mask = var_4963_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4963_cast_fp16")]; tensor var_4967_begin_0 = const()[name = tensor("op_4967_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_4967_end_0 = const()[name = tensor("op_4967_end_0"), val = tensor([2, 832, 1, 36])]; tensor var_4967_end_mask_0 = const()[name = tensor("op_4967_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4967_cast_fp16 = slice_by_index(begin = var_4967_begin_0, end = var_4967_end_0, end_mask = var_4967_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4967_cast_fp16")]; tensor var_4971_begin_0 = const()[name = tensor("op_4971_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_4971_end_0 = const()[name = tensor("op_4971_end_0"), val = tensor([2, 896, 1, 36])]; tensor var_4971_end_mask_0 = const()[name = tensor("op_4971_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4971_cast_fp16 = slice_by_index(begin = var_4971_begin_0, end = var_4971_end_0, end_mask = var_4971_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4971_cast_fp16")]; tensor var_4975_begin_0 = const()[name = tensor("op_4975_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_4975_end_0 = const()[name = tensor("op_4975_end_0"), val = tensor([2, 960, 1, 36])]; tensor var_4975_end_mask_0 = const()[name = tensor("op_4975_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4975_cast_fp16 = slice_by_index(begin = var_4975_begin_0, end = var_4975_end_0, end_mask = var_4975_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4975_cast_fp16")]; tensor var_4979_begin_0 = const()[name = tensor("op_4979_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_4979_end_0 = const()[name = tensor("op_4979_end_0"), val = tensor([2, 1024, 1, 36])]; tensor var_4979_end_mask_0 = const()[name = tensor("op_4979_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4979_cast_fp16 = slice_by_index(begin = var_4979_begin_0, end = var_4979_end_0, end_mask = var_4979_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4979_cast_fp16")]; tensor var_4983_begin_0 = const()[name = tensor("op_4983_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_4983_end_0 = const()[name = tensor("op_4983_end_0"), val = tensor([2, 1088, 1, 36])]; tensor var_4983_end_mask_0 = const()[name = tensor("op_4983_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4983_cast_fp16 = slice_by_index(begin = var_4983_begin_0, end = var_4983_end_0, end_mask = var_4983_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4983_cast_fp16")]; tensor var_4987_begin_0 = const()[name = tensor("op_4987_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_4987_end_0 = const()[name = tensor("op_4987_end_0"), val = tensor([2, 1152, 1, 36])]; tensor var_4987_end_mask_0 = const()[name = tensor("op_4987_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4987_cast_fp16 = slice_by_index(begin = var_4987_begin_0, end = var_4987_end_0, end_mask = var_4987_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4987_cast_fp16")]; tensor var_4991_begin_0 = const()[name = tensor("op_4991_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_4991_end_0 = const()[name = tensor("op_4991_end_0"), val = tensor([2, 1216, 1, 36])]; tensor var_4991_end_mask_0 = const()[name = tensor("op_4991_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4991_cast_fp16 = slice_by_index(begin = var_4991_begin_0, end = var_4991_end_0, end_mask = var_4991_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4991_cast_fp16")]; tensor var_4995_begin_0 = const()[name = tensor("op_4995_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_4995_end_0 = const()[name = tensor("op_4995_end_0"), val = tensor([2, 1280, 1, 36])]; tensor var_4995_end_mask_0 = const()[name = tensor("op_4995_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_4995_cast_fp16 = slice_by_index(begin = var_4995_begin_0, end = var_4995_end_0, end_mask = var_4995_end_mask_0, x = q_27_cast_fp16)[name = tensor("op_4995_cast_fp16")]; tensor k_55_perm_0 = const()[name = tensor("k_55_perm_0"), val = tensor([0, 3, 2, 1])]; tensor var_5002_begin_0 = const()[name = tensor("op_5002_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_5002_end_0 = const()[name = tensor("op_5002_end_0"), val = tensor([2, 77, 1, 64])]; tensor var_5002_end_mask_0 = const()[name = tensor("op_5002_end_mask_0"), val = tensor([true, true, true, false])]; tensor transpose_0 = transpose(perm = k_55_perm_0, x = k_53_cast_fp16)[name = tensor("transpose_0")]; tensor var_5002_cast_fp16 = slice_by_index(begin = var_5002_begin_0, end = var_5002_end_0, end_mask = var_5002_end_mask_0, x = transpose_0)[name = tensor("op_5002_cast_fp16")]; tensor var_5006_begin_0 = const()[name = tensor("op_5006_begin_0"), val = tensor([0, 0, 0, 64])]; tensor var_5006_end_0 = const()[name = tensor("op_5006_end_0"), val = tensor([2, 77, 1, 128])]; tensor var_5006_end_mask_0 = const()[name = tensor("op_5006_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5006_cast_fp16 = slice_by_index(begin = var_5006_begin_0, end = var_5006_end_0, end_mask = var_5006_end_mask_0, x = transpose_0)[name = tensor("op_5006_cast_fp16")]; tensor var_5010_begin_0 = const()[name = tensor("op_5010_begin_0"), val = tensor([0, 0, 0, 128])]; tensor var_5010_end_0 = const()[name = tensor("op_5010_end_0"), val = tensor([2, 77, 1, 192])]; tensor var_5010_end_mask_0 = const()[name = tensor("op_5010_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5010_cast_fp16 = slice_by_index(begin = var_5010_begin_0, end = var_5010_end_0, end_mask = var_5010_end_mask_0, x = transpose_0)[name = tensor("op_5010_cast_fp16")]; tensor var_5014_begin_0 = const()[name = tensor("op_5014_begin_0"), val = tensor([0, 0, 0, 192])]; tensor var_5014_end_0 = const()[name = tensor("op_5014_end_0"), val = tensor([2, 77, 1, 256])]; tensor var_5014_end_mask_0 = const()[name = tensor("op_5014_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5014_cast_fp16 = slice_by_index(begin = var_5014_begin_0, end = var_5014_end_0, end_mask = var_5014_end_mask_0, x = transpose_0)[name = tensor("op_5014_cast_fp16")]; tensor var_5018_begin_0 = const()[name = tensor("op_5018_begin_0"), val = tensor([0, 0, 0, 256])]; tensor var_5018_end_0 = const()[name = tensor("op_5018_end_0"), val = tensor([2, 77, 1, 320])]; tensor var_5018_end_mask_0 = const()[name = tensor("op_5018_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5018_cast_fp16 = slice_by_index(begin = var_5018_begin_0, end = var_5018_end_0, end_mask = var_5018_end_mask_0, x = transpose_0)[name = tensor("op_5018_cast_fp16")]; tensor var_5022_begin_0 = const()[name = tensor("op_5022_begin_0"), val = tensor([0, 0, 0, 320])]; tensor var_5022_end_0 = const()[name = tensor("op_5022_end_0"), val = tensor([2, 77, 1, 384])]; tensor var_5022_end_mask_0 = const()[name = tensor("op_5022_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5022_cast_fp16 = slice_by_index(begin = var_5022_begin_0, end = var_5022_end_0, end_mask = var_5022_end_mask_0, x = transpose_0)[name = tensor("op_5022_cast_fp16")]; tensor var_5026_begin_0 = const()[name = tensor("op_5026_begin_0"), val = tensor([0, 0, 0, 384])]; tensor var_5026_end_0 = const()[name = tensor("op_5026_end_0"), val = tensor([2, 77, 1, 448])]; tensor var_5026_end_mask_0 = const()[name = tensor("op_5026_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5026_cast_fp16 = slice_by_index(begin = var_5026_begin_0, end = var_5026_end_0, end_mask = var_5026_end_mask_0, x = transpose_0)[name = tensor("op_5026_cast_fp16")]; tensor var_5030_begin_0 = const()[name = tensor("op_5030_begin_0"), val = tensor([0, 0, 0, 448])]; tensor var_5030_end_0 = const()[name = tensor("op_5030_end_0"), val = tensor([2, 77, 1, 512])]; tensor var_5030_end_mask_0 = const()[name = tensor("op_5030_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5030_cast_fp16 = slice_by_index(begin = var_5030_begin_0, end = var_5030_end_0, end_mask = var_5030_end_mask_0, x = transpose_0)[name = tensor("op_5030_cast_fp16")]; tensor var_5034_begin_0 = const()[name = tensor("op_5034_begin_0"), val = tensor([0, 0, 0, 512])]; tensor var_5034_end_0 = const()[name = tensor("op_5034_end_0"), val = tensor([2, 77, 1, 576])]; tensor var_5034_end_mask_0 = const()[name = tensor("op_5034_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5034_cast_fp16 = slice_by_index(begin = var_5034_begin_0, end = var_5034_end_0, end_mask = var_5034_end_mask_0, x = transpose_0)[name = tensor("op_5034_cast_fp16")]; tensor var_5038_begin_0 = const()[name = tensor("op_5038_begin_0"), val = tensor([0, 0, 0, 576])]; tensor var_5038_end_0 = const()[name = tensor("op_5038_end_0"), val = tensor([2, 77, 1, 640])]; tensor var_5038_end_mask_0 = const()[name = tensor("op_5038_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5038_cast_fp16 = slice_by_index(begin = var_5038_begin_0, end = var_5038_end_0, end_mask = var_5038_end_mask_0, x = transpose_0)[name = tensor("op_5038_cast_fp16")]; tensor var_5042_begin_0 = const()[name = tensor("op_5042_begin_0"), val = tensor([0, 0, 0, 640])]; tensor var_5042_end_0 = const()[name = tensor("op_5042_end_0"), val = tensor([2, 77, 1, 704])]; tensor var_5042_end_mask_0 = const()[name = tensor("op_5042_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5042_cast_fp16 = slice_by_index(begin = var_5042_begin_0, end = var_5042_end_0, end_mask = var_5042_end_mask_0, x = transpose_0)[name = tensor("op_5042_cast_fp16")]; tensor var_5046_begin_0 = const()[name = tensor("op_5046_begin_0"), val = tensor([0, 0, 0, 704])]; tensor var_5046_end_0 = const()[name = tensor("op_5046_end_0"), val = tensor([2, 77, 1, 768])]; tensor var_5046_end_mask_0 = const()[name = tensor("op_5046_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5046_cast_fp16 = slice_by_index(begin = var_5046_begin_0, end = var_5046_end_0, end_mask = var_5046_end_mask_0, x = transpose_0)[name = tensor("op_5046_cast_fp16")]; tensor var_5050_begin_0 = const()[name = tensor("op_5050_begin_0"), val = tensor([0, 0, 0, 768])]; tensor var_5050_end_0 = const()[name = tensor("op_5050_end_0"), val = tensor([2, 77, 1, 832])]; tensor var_5050_end_mask_0 = const()[name = tensor("op_5050_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5050_cast_fp16 = slice_by_index(begin = var_5050_begin_0, end = var_5050_end_0, end_mask = var_5050_end_mask_0, x = transpose_0)[name = tensor("op_5050_cast_fp16")]; tensor var_5054_begin_0 = const()[name = tensor("op_5054_begin_0"), val = tensor([0, 0, 0, 832])]; tensor var_5054_end_0 = const()[name = tensor("op_5054_end_0"), val = tensor([2, 77, 1, 896])]; tensor var_5054_end_mask_0 = const()[name = tensor("op_5054_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5054_cast_fp16 = slice_by_index(begin = var_5054_begin_0, end = var_5054_end_0, end_mask = var_5054_end_mask_0, x = transpose_0)[name = tensor("op_5054_cast_fp16")]; tensor var_5058_begin_0 = const()[name = tensor("op_5058_begin_0"), val = tensor([0, 0, 0, 896])]; tensor var_5058_end_0 = const()[name = tensor("op_5058_end_0"), val = tensor([2, 77, 1, 960])]; tensor var_5058_end_mask_0 = const()[name = tensor("op_5058_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5058_cast_fp16 = slice_by_index(begin = var_5058_begin_0, end = var_5058_end_0, end_mask = var_5058_end_mask_0, x = transpose_0)[name = tensor("op_5058_cast_fp16")]; tensor var_5062_begin_0 = const()[name = tensor("op_5062_begin_0"), val = tensor([0, 0, 0, 960])]; tensor var_5062_end_0 = const()[name = tensor("op_5062_end_0"), val = tensor([2, 77, 1, 1024])]; tensor var_5062_end_mask_0 = const()[name = tensor("op_5062_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5062_cast_fp16 = slice_by_index(begin = var_5062_begin_0, end = var_5062_end_0, end_mask = var_5062_end_mask_0, x = transpose_0)[name = tensor("op_5062_cast_fp16")]; tensor var_5066_begin_0 = const()[name = tensor("op_5066_begin_0"), val = tensor([0, 0, 0, 1024])]; tensor var_5066_end_0 = const()[name = tensor("op_5066_end_0"), val = tensor([2, 77, 1, 1088])]; tensor var_5066_end_mask_0 = const()[name = tensor("op_5066_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5066_cast_fp16 = slice_by_index(begin = var_5066_begin_0, end = var_5066_end_0, end_mask = var_5066_end_mask_0, x = transpose_0)[name = tensor("op_5066_cast_fp16")]; tensor var_5070_begin_0 = const()[name = tensor("op_5070_begin_0"), val = tensor([0, 0, 0, 1088])]; tensor var_5070_end_0 = const()[name = tensor("op_5070_end_0"), val = tensor([2, 77, 1, 1152])]; tensor var_5070_end_mask_0 = const()[name = tensor("op_5070_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5070_cast_fp16 = slice_by_index(begin = var_5070_begin_0, end = var_5070_end_0, end_mask = var_5070_end_mask_0, x = transpose_0)[name = tensor("op_5070_cast_fp16")]; tensor var_5074_begin_0 = const()[name = tensor("op_5074_begin_0"), val = tensor([0, 0, 0, 1152])]; tensor var_5074_end_0 = const()[name = tensor("op_5074_end_0"), val = tensor([2, 77, 1, 1216])]; tensor var_5074_end_mask_0 = const()[name = tensor("op_5074_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5074_cast_fp16 = slice_by_index(begin = var_5074_begin_0, end = var_5074_end_0, end_mask = var_5074_end_mask_0, x = transpose_0)[name = tensor("op_5074_cast_fp16")]; tensor var_5078_begin_0 = const()[name = tensor("op_5078_begin_0"), val = tensor([0, 0, 0, 1216])]; tensor var_5078_end_0 = const()[name = tensor("op_5078_end_0"), val = tensor([2, 77, 1, 1280])]; tensor var_5078_end_mask_0 = const()[name = tensor("op_5078_end_mask_0"), val = tensor([true, true, true, false])]; tensor var_5078_cast_fp16 = slice_by_index(begin = var_5078_begin_0, end = var_5078_end_0, end_mask = var_5078_end_mask_0, x = transpose_0)[name = tensor("op_5078_cast_fp16")]; tensor var_5080_begin_0 = const()[name = tensor("op_5080_begin_0"), val = tensor([0, 0, 0, 0])]; tensor var_5080_end_0 = const()[name = tensor("op_5080_end_0"), val = tensor([2, 64, 1, 77])]; tensor var_5080_end_mask_0 = const()[name = tensor("op_5080_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5080_cast_fp16 = slice_by_index(begin = var_5080_begin_0, end = var_5080_end_0, end_mask = var_5080_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5080_cast_fp16")]; tensor var_5084_begin_0 = const()[name = tensor("op_5084_begin_0"), val = tensor([0, 64, 0, 0])]; tensor var_5084_end_0 = const()[name = tensor("op_5084_end_0"), val = tensor([2, 128, 1, 77])]; tensor var_5084_end_mask_0 = const()[name = tensor("op_5084_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5084_cast_fp16 = slice_by_index(begin = var_5084_begin_0, end = var_5084_end_0, end_mask = var_5084_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5084_cast_fp16")]; tensor var_5088_begin_0 = const()[name = tensor("op_5088_begin_0"), val = tensor([0, 128, 0, 0])]; tensor var_5088_end_0 = const()[name = tensor("op_5088_end_0"), val = tensor([2, 192, 1, 77])]; tensor var_5088_end_mask_0 = const()[name = tensor("op_5088_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5088_cast_fp16 = slice_by_index(begin = var_5088_begin_0, end = var_5088_end_0, end_mask = var_5088_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5088_cast_fp16")]; tensor var_5092_begin_0 = const()[name = tensor("op_5092_begin_0"), val = tensor([0, 192, 0, 0])]; tensor var_5092_end_0 = const()[name = tensor("op_5092_end_0"), val = tensor([2, 256, 1, 77])]; tensor var_5092_end_mask_0 = const()[name = tensor("op_5092_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5092_cast_fp16 = slice_by_index(begin = var_5092_begin_0, end = var_5092_end_0, end_mask = var_5092_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5092_cast_fp16")]; tensor var_5096_begin_0 = const()[name = tensor("op_5096_begin_0"), val = tensor([0, 256, 0, 0])]; tensor var_5096_end_0 = const()[name = tensor("op_5096_end_0"), val = tensor([2, 320, 1, 77])]; tensor var_5096_end_mask_0 = const()[name = tensor("op_5096_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5096_cast_fp16 = slice_by_index(begin = var_5096_begin_0, end = var_5096_end_0, end_mask = var_5096_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5096_cast_fp16")]; tensor var_5100_begin_0 = const()[name = tensor("op_5100_begin_0"), val = tensor([0, 320, 0, 0])]; tensor var_5100_end_0 = const()[name = tensor("op_5100_end_0"), val = tensor([2, 384, 1, 77])]; tensor var_5100_end_mask_0 = const()[name = tensor("op_5100_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5100_cast_fp16 = slice_by_index(begin = var_5100_begin_0, end = var_5100_end_0, end_mask = var_5100_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5100_cast_fp16")]; tensor var_5104_begin_0 = const()[name = tensor("op_5104_begin_0"), val = tensor([0, 384, 0, 0])]; tensor var_5104_end_0 = const()[name = tensor("op_5104_end_0"), val = tensor([2, 448, 1, 77])]; tensor var_5104_end_mask_0 = const()[name = tensor("op_5104_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5104_cast_fp16 = slice_by_index(begin = var_5104_begin_0, end = var_5104_end_0, end_mask = var_5104_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5104_cast_fp16")]; tensor var_5108_begin_0 = const()[name = tensor("op_5108_begin_0"), val = tensor([0, 448, 0, 0])]; tensor var_5108_end_0 = const()[name = tensor("op_5108_end_0"), val = tensor([2, 512, 1, 77])]; tensor var_5108_end_mask_0 = const()[name = tensor("op_5108_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5108_cast_fp16 = slice_by_index(begin = var_5108_begin_0, end = var_5108_end_0, end_mask = var_5108_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5108_cast_fp16")]; tensor var_5112_begin_0 = const()[name = tensor("op_5112_begin_0"), val = tensor([0, 512, 0, 0])]; tensor var_5112_end_0 = const()[name = tensor("op_5112_end_0"), val = tensor([2, 576, 1, 77])]; tensor var_5112_end_mask_0 = const()[name = tensor("op_5112_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5112_cast_fp16 = slice_by_index(begin = var_5112_begin_0, end = var_5112_end_0, end_mask = var_5112_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5112_cast_fp16")]; tensor var_5116_begin_0 = const()[name = tensor("op_5116_begin_0"), val = tensor([0, 576, 0, 0])]; tensor var_5116_end_0 = const()[name = tensor("op_5116_end_0"), val = tensor([2, 640, 1, 77])]; tensor var_5116_end_mask_0 = const()[name = tensor("op_5116_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5116_cast_fp16 = slice_by_index(begin = var_5116_begin_0, end = var_5116_end_0, end_mask = var_5116_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5116_cast_fp16")]; tensor var_5120_begin_0 = const()[name = tensor("op_5120_begin_0"), val = tensor([0, 640, 0, 0])]; tensor var_5120_end_0 = const()[name = tensor("op_5120_end_0"), val = tensor([2, 704, 1, 77])]; tensor var_5120_end_mask_0 = const()[name = tensor("op_5120_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5120_cast_fp16 = slice_by_index(begin = var_5120_begin_0, end = var_5120_end_0, end_mask = var_5120_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5120_cast_fp16")]; tensor var_5124_begin_0 = const()[name = tensor("op_5124_begin_0"), val = tensor([0, 704, 0, 0])]; tensor var_5124_end_0 = const()[name = tensor("op_5124_end_0"), val = tensor([2, 768, 1, 77])]; tensor var_5124_end_mask_0 = const()[name = tensor("op_5124_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5124_cast_fp16 = slice_by_index(begin = var_5124_begin_0, end = var_5124_end_0, end_mask = var_5124_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5124_cast_fp16")]; tensor var_5128_begin_0 = const()[name = tensor("op_5128_begin_0"), val = tensor([0, 768, 0, 0])]; tensor var_5128_end_0 = const()[name = tensor("op_5128_end_0"), val = tensor([2, 832, 1, 77])]; tensor var_5128_end_mask_0 = const()[name = tensor("op_5128_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5128_cast_fp16 = slice_by_index(begin = var_5128_begin_0, end = var_5128_end_0, end_mask = var_5128_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5128_cast_fp16")]; tensor var_5132_begin_0 = const()[name = tensor("op_5132_begin_0"), val = tensor([0, 832, 0, 0])]; tensor var_5132_end_0 = const()[name = tensor("op_5132_end_0"), val = tensor([2, 896, 1, 77])]; tensor var_5132_end_mask_0 = const()[name = tensor("op_5132_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5132_cast_fp16 = slice_by_index(begin = var_5132_begin_0, end = var_5132_end_0, end_mask = var_5132_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5132_cast_fp16")]; tensor var_5136_begin_0 = const()[name = tensor("op_5136_begin_0"), val = tensor([0, 896, 0, 0])]; tensor var_5136_end_0 = const()[name = tensor("op_5136_end_0"), val = tensor([2, 960, 1, 77])]; tensor var_5136_end_mask_0 = const()[name = tensor("op_5136_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5136_cast_fp16 = slice_by_index(begin = var_5136_begin_0, end = var_5136_end_0, end_mask = var_5136_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5136_cast_fp16")]; tensor var_5140_begin_0 = const()[name = tensor("op_5140_begin_0"), val = tensor([0, 960, 0, 0])]; tensor var_5140_end_0 = const()[name = tensor("op_5140_end_0"), val = tensor([2, 1024, 1, 77])]; tensor var_5140_end_mask_0 = const()[name = tensor("op_5140_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5140_cast_fp16 = slice_by_index(begin = var_5140_begin_0, end = var_5140_end_0, end_mask = var_5140_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5140_cast_fp16")]; tensor var_5144_begin_0 = const()[name = tensor("op_5144_begin_0"), val = tensor([0, 1024, 0, 0])]; tensor var_5144_end_0 = const()[name = tensor("op_5144_end_0"), val = tensor([2, 1088, 1, 77])]; tensor var_5144_end_mask_0 = const()[name = tensor("op_5144_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5144_cast_fp16 = slice_by_index(begin = var_5144_begin_0, end = var_5144_end_0, end_mask = var_5144_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5144_cast_fp16")]; tensor var_5148_begin_0 = const()[name = tensor("op_5148_begin_0"), val = tensor([0, 1088, 0, 0])]; tensor var_5148_end_0 = const()[name = tensor("op_5148_end_0"), val = tensor([2, 1152, 1, 77])]; tensor var_5148_end_mask_0 = const()[name = tensor("op_5148_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5148_cast_fp16 = slice_by_index(begin = var_5148_begin_0, end = var_5148_end_0, end_mask = var_5148_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5148_cast_fp16")]; tensor var_5152_begin_0 = const()[name = tensor("op_5152_begin_0"), val = tensor([0, 1152, 0, 0])]; tensor var_5152_end_0 = const()[name = tensor("op_5152_end_0"), val = tensor([2, 1216, 1, 77])]; tensor var_5152_end_mask_0 = const()[name = tensor("op_5152_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5152_cast_fp16 = slice_by_index(begin = var_5152_begin_0, end = var_5152_end_0, end_mask = var_5152_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5152_cast_fp16")]; tensor var_5156_begin_0 = const()[name = tensor("op_5156_begin_0"), val = tensor([0, 1216, 0, 0])]; tensor var_5156_end_0 = const()[name = tensor("op_5156_end_0"), val = tensor([2, 1280, 1, 77])]; tensor var_5156_end_mask_0 = const()[name = tensor("op_5156_end_mask_0"), val = tensor([true, false, true, true])]; tensor var_5156_cast_fp16 = slice_by_index(begin = var_5156_begin_0, end = var_5156_end_0, end_mask = var_5156_end_mask_0, x = v_27_cast_fp16)[name = tensor("op_5156_cast_fp16")]; tensor var_5160_equation_0 = const()[name = tensor("op_5160_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5160_cast_fp16 = einsum(equation = var_5160_equation_0, values = (var_5002_cast_fp16, var_4919_cast_fp16))[name = tensor("op_5160_cast_fp16")]; tensor var_5161_to_fp16 = const()[name = tensor("op_5161_to_fp16"), val = tensor(0x1p-3)]; tensor aw_321_cast_fp16 = mul(x = var_5160_cast_fp16, y = var_5161_to_fp16)[name = tensor("aw_321_cast_fp16")]; tensor var_5164_equation_0 = const()[name = tensor("op_5164_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5164_cast_fp16 = einsum(equation = var_5164_equation_0, values = (var_5006_cast_fp16, var_4923_cast_fp16))[name = tensor("op_5164_cast_fp16")]; tensor var_5165_to_fp16 = const()[name = tensor("op_5165_to_fp16"), val = tensor(0x1p-3)]; tensor aw_323_cast_fp16 = mul(x = var_5164_cast_fp16, y = var_5165_to_fp16)[name = tensor("aw_323_cast_fp16")]; tensor var_5168_equation_0 = const()[name = tensor("op_5168_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5168_cast_fp16 = einsum(equation = var_5168_equation_0, values = (var_5010_cast_fp16, var_4927_cast_fp16))[name = tensor("op_5168_cast_fp16")]; tensor var_5169_to_fp16 = const()[name = tensor("op_5169_to_fp16"), val = tensor(0x1p-3)]; tensor aw_325_cast_fp16 = mul(x = var_5168_cast_fp16, y = var_5169_to_fp16)[name = tensor("aw_325_cast_fp16")]; tensor var_5172_equation_0 = const()[name = tensor("op_5172_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5172_cast_fp16 = einsum(equation = var_5172_equation_0, values = (var_5014_cast_fp16, var_4931_cast_fp16))[name = tensor("op_5172_cast_fp16")]; tensor var_5173_to_fp16 = const()[name = tensor("op_5173_to_fp16"), val = tensor(0x1p-3)]; tensor aw_327_cast_fp16 = mul(x = var_5172_cast_fp16, y = var_5173_to_fp16)[name = tensor("aw_327_cast_fp16")]; tensor var_5176_equation_0 = const()[name = tensor("op_5176_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5176_cast_fp16 = einsum(equation = var_5176_equation_0, values = (var_5018_cast_fp16, var_4935_cast_fp16))[name = tensor("op_5176_cast_fp16")]; tensor var_5177_to_fp16 = const()[name = tensor("op_5177_to_fp16"), val = tensor(0x1p-3)]; tensor aw_329_cast_fp16 = mul(x = var_5176_cast_fp16, y = var_5177_to_fp16)[name = tensor("aw_329_cast_fp16")]; tensor var_5180_equation_0 = const()[name = tensor("op_5180_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5180_cast_fp16 = einsum(equation = var_5180_equation_0, values = (var_5022_cast_fp16, var_4939_cast_fp16))[name = tensor("op_5180_cast_fp16")]; tensor var_5181_to_fp16 = const()[name = tensor("op_5181_to_fp16"), val = tensor(0x1p-3)]; tensor aw_331_cast_fp16 = mul(x = var_5180_cast_fp16, y = var_5181_to_fp16)[name = tensor("aw_331_cast_fp16")]; tensor var_5184_equation_0 = const()[name = tensor("op_5184_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5184_cast_fp16 = einsum(equation = var_5184_equation_0, values = (var_5026_cast_fp16, var_4943_cast_fp16))[name = tensor("op_5184_cast_fp16")]; tensor var_5185_to_fp16 = const()[name = tensor("op_5185_to_fp16"), val = tensor(0x1p-3)]; tensor aw_333_cast_fp16 = mul(x = var_5184_cast_fp16, y = var_5185_to_fp16)[name = tensor("aw_333_cast_fp16")]; tensor var_5188_equation_0 = const()[name = tensor("op_5188_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5188_cast_fp16 = einsum(equation = var_5188_equation_0, values = (var_5030_cast_fp16, var_4947_cast_fp16))[name = tensor("op_5188_cast_fp16")]; tensor var_5189_to_fp16 = const()[name = tensor("op_5189_to_fp16"), val = tensor(0x1p-3)]; tensor aw_335_cast_fp16 = mul(x = var_5188_cast_fp16, y = var_5189_to_fp16)[name = tensor("aw_335_cast_fp16")]; tensor var_5192_equation_0 = const()[name = tensor("op_5192_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5192_cast_fp16 = einsum(equation = var_5192_equation_0, values = (var_5034_cast_fp16, var_4951_cast_fp16))[name = tensor("op_5192_cast_fp16")]; tensor var_5193_to_fp16 = const()[name = tensor("op_5193_to_fp16"), val = tensor(0x1p-3)]; tensor aw_337_cast_fp16 = mul(x = var_5192_cast_fp16, y = var_5193_to_fp16)[name = tensor("aw_337_cast_fp16")]; tensor var_5196_equation_0 = const()[name = tensor("op_5196_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5196_cast_fp16 = einsum(equation = var_5196_equation_0, values = (var_5038_cast_fp16, var_4955_cast_fp16))[name = tensor("op_5196_cast_fp16")]; tensor var_5197_to_fp16 = const()[name = tensor("op_5197_to_fp16"), val = tensor(0x1p-3)]; tensor aw_339_cast_fp16 = mul(x = var_5196_cast_fp16, y = var_5197_to_fp16)[name = tensor("aw_339_cast_fp16")]; tensor var_5200_equation_0 = const()[name = tensor("op_5200_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5200_cast_fp16 = einsum(equation = var_5200_equation_0, values = (var_5042_cast_fp16, var_4959_cast_fp16))[name = tensor("op_5200_cast_fp16")]; tensor var_5201_to_fp16 = const()[name = tensor("op_5201_to_fp16"), val = tensor(0x1p-3)]; tensor aw_341_cast_fp16 = mul(x = var_5200_cast_fp16, y = var_5201_to_fp16)[name = tensor("aw_341_cast_fp16")]; tensor var_5204_equation_0 = const()[name = tensor("op_5204_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5204_cast_fp16 = einsum(equation = var_5204_equation_0, values = (var_5046_cast_fp16, var_4963_cast_fp16))[name = tensor("op_5204_cast_fp16")]; tensor var_5205_to_fp16 = const()[name = tensor("op_5205_to_fp16"), val = tensor(0x1p-3)]; tensor aw_343_cast_fp16 = mul(x = var_5204_cast_fp16, y = var_5205_to_fp16)[name = tensor("aw_343_cast_fp16")]; tensor var_5208_equation_0 = const()[name = tensor("op_5208_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5208_cast_fp16 = einsum(equation = var_5208_equation_0, values = (var_5050_cast_fp16, var_4967_cast_fp16))[name = tensor("op_5208_cast_fp16")]; tensor var_5209_to_fp16 = const()[name = tensor("op_5209_to_fp16"), val = tensor(0x1p-3)]; tensor aw_345_cast_fp16 = mul(x = var_5208_cast_fp16, y = var_5209_to_fp16)[name = tensor("aw_345_cast_fp16")]; tensor var_5212_equation_0 = const()[name = tensor("op_5212_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5212_cast_fp16 = einsum(equation = var_5212_equation_0, values = (var_5054_cast_fp16, var_4971_cast_fp16))[name = tensor("op_5212_cast_fp16")]; tensor var_5213_to_fp16 = const()[name = tensor("op_5213_to_fp16"), val = tensor(0x1p-3)]; tensor aw_347_cast_fp16 = mul(x = var_5212_cast_fp16, y = var_5213_to_fp16)[name = tensor("aw_347_cast_fp16")]; tensor var_5216_equation_0 = const()[name = tensor("op_5216_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5216_cast_fp16 = einsum(equation = var_5216_equation_0, values = (var_5058_cast_fp16, var_4975_cast_fp16))[name = tensor("op_5216_cast_fp16")]; tensor var_5217_to_fp16 = const()[name = tensor("op_5217_to_fp16"), val = tensor(0x1p-3)]; tensor aw_349_cast_fp16 = mul(x = var_5216_cast_fp16, y = var_5217_to_fp16)[name = tensor("aw_349_cast_fp16")]; tensor var_5220_equation_0 = const()[name = tensor("op_5220_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5220_cast_fp16 = einsum(equation = var_5220_equation_0, values = (var_5062_cast_fp16, var_4979_cast_fp16))[name = tensor("op_5220_cast_fp16")]; tensor var_5221_to_fp16 = const()[name = tensor("op_5221_to_fp16"), val = tensor(0x1p-3)]; tensor aw_351_cast_fp16 = mul(x = var_5220_cast_fp16, y = var_5221_to_fp16)[name = tensor("aw_351_cast_fp16")]; tensor var_5224_equation_0 = const()[name = tensor("op_5224_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5224_cast_fp16 = einsum(equation = var_5224_equation_0, values = (var_5066_cast_fp16, var_4983_cast_fp16))[name = tensor("op_5224_cast_fp16")]; tensor var_5225_to_fp16 = const()[name = tensor("op_5225_to_fp16"), val = tensor(0x1p-3)]; tensor aw_353_cast_fp16 = mul(x = var_5224_cast_fp16, y = var_5225_to_fp16)[name = tensor("aw_353_cast_fp16")]; tensor var_5228_equation_0 = const()[name = tensor("op_5228_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5228_cast_fp16 = einsum(equation = var_5228_equation_0, values = (var_5070_cast_fp16, var_4987_cast_fp16))[name = tensor("op_5228_cast_fp16")]; tensor var_5229_to_fp16 = const()[name = tensor("op_5229_to_fp16"), val = tensor(0x1p-3)]; tensor aw_355_cast_fp16 = mul(x = var_5228_cast_fp16, y = var_5229_to_fp16)[name = tensor("aw_355_cast_fp16")]; tensor var_5232_equation_0 = const()[name = tensor("op_5232_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5232_cast_fp16 = einsum(equation = var_5232_equation_0, values = (var_5074_cast_fp16, var_4991_cast_fp16))[name = tensor("op_5232_cast_fp16")]; tensor var_5233_to_fp16 = const()[name = tensor("op_5233_to_fp16"), val = tensor(0x1p-3)]; tensor aw_357_cast_fp16 = mul(x = var_5232_cast_fp16, y = var_5233_to_fp16)[name = tensor("aw_357_cast_fp16")]; tensor var_5236_equation_0 = const()[name = tensor("op_5236_equation_0"), val = tensor("bkhc,bchq->bkhq")]; tensor var_5236_cast_fp16 = einsum(equation = var_5236_equation_0, values = (var_5078_cast_fp16, var_4995_cast_fp16))[name = tensor("op_5236_cast_fp16")]; tensor var_5237_to_fp16 = const()[name = tensor("op_5237_to_fp16"), val = tensor(0x1p-3)]; tensor aw_359_cast_fp16 = mul(x = var_5236_cast_fp16, y = var_5237_to_fp16)[name = tensor("aw_359_cast_fp16")]; tensor var_5239_cast_fp16 = softmax(axis = var_4371, x = aw_321_cast_fp16)[name = tensor("op_5239_cast_fp16")]; tensor var_5240_cast_fp16 = softmax(axis = var_4371, x = aw_323_cast_fp16)[name = tensor("op_5240_cast_fp16")]; tensor var_5241_cast_fp16 = softmax(axis = var_4371, x = aw_325_cast_fp16)[name = tensor("op_5241_cast_fp16")]; tensor var_5242_cast_fp16 = softmax(axis = var_4371, x = aw_327_cast_fp16)[name = tensor("op_5242_cast_fp16")]; tensor var_5243_cast_fp16 = softmax(axis = var_4371, x = aw_329_cast_fp16)[name = tensor("op_5243_cast_fp16")]; tensor var_5244_cast_fp16 = softmax(axis = var_4371, x = aw_331_cast_fp16)[name = tensor("op_5244_cast_fp16")]; tensor var_5245_cast_fp16 = softmax(axis = var_4371, x = aw_333_cast_fp16)[name = tensor("op_5245_cast_fp16")]; tensor var_5246_cast_fp16 = softmax(axis = var_4371, x = aw_335_cast_fp16)[name = tensor("op_5246_cast_fp16")]; tensor var_5247_cast_fp16 = softmax(axis = var_4371, x = aw_337_cast_fp16)[name = tensor("op_5247_cast_fp16")]; tensor var_5248_cast_fp16 = softmax(axis = var_4371, x = aw_339_cast_fp16)[name = tensor("op_5248_cast_fp16")]; tensor var_5249_cast_fp16 = softmax(axis = var_4371, x = aw_341_cast_fp16)[name = tensor("op_5249_cast_fp16")]; tensor var_5250_cast_fp16 = softmax(axis = var_4371, x = aw_343_cast_fp16)[name = tensor("op_5250_cast_fp16")]; tensor var_5251_cast_fp16 = softmax(axis = var_4371, x = aw_345_cast_fp16)[name = tensor("op_5251_cast_fp16")]; tensor var_5252_cast_fp16 = softmax(axis = var_4371, x = aw_347_cast_fp16)[name = tensor("op_5252_cast_fp16")]; tensor var_5253_cast_fp16 = softmax(axis = var_4371, x = aw_349_cast_fp16)[name = tensor("op_5253_cast_fp16")]; tensor var_5254_cast_fp16 = softmax(axis = var_4371, x = aw_351_cast_fp16)[name = tensor("op_5254_cast_fp16")]; tensor var_5255_cast_fp16 = softmax(axis = var_4371, x = aw_353_cast_fp16)[name = tensor("op_5255_cast_fp16")]; tensor var_5256_cast_fp16 = softmax(axis = var_4371, x = aw_355_cast_fp16)[name = tensor("op_5256_cast_fp16")]; tensor var_5257_cast_fp16 = softmax(axis = var_4371, x = aw_357_cast_fp16)[name = tensor("op_5257_cast_fp16")]; tensor var_5258_cast_fp16 = softmax(axis = var_4371, x = aw_359_cast_fp16)[name = tensor("op_5258_cast_fp16")]; tensor var_5260_equation_0 = const()[name = tensor("op_5260_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5260_cast_fp16 = einsum(equation = var_5260_equation_0, values = (var_5080_cast_fp16, var_5239_cast_fp16))[name = tensor("op_5260_cast_fp16")]; tensor var_5262_equation_0 = const()[name = tensor("op_5262_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5262_cast_fp16 = einsum(equation = var_5262_equation_0, values = (var_5084_cast_fp16, var_5240_cast_fp16))[name = tensor("op_5262_cast_fp16")]; tensor var_5264_equation_0 = const()[name = tensor("op_5264_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5264_cast_fp16 = einsum(equation = var_5264_equation_0, values = (var_5088_cast_fp16, var_5241_cast_fp16))[name = tensor("op_5264_cast_fp16")]; tensor var_5266_equation_0 = const()[name = tensor("op_5266_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5266_cast_fp16 = einsum(equation = var_5266_equation_0, values = (var_5092_cast_fp16, var_5242_cast_fp16))[name = tensor("op_5266_cast_fp16")]; tensor var_5268_equation_0 = const()[name = tensor("op_5268_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5268_cast_fp16 = einsum(equation = var_5268_equation_0, values = (var_5096_cast_fp16, var_5243_cast_fp16))[name = tensor("op_5268_cast_fp16")]; tensor var_5270_equation_0 = const()[name = tensor("op_5270_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5270_cast_fp16 = einsum(equation = var_5270_equation_0, values = (var_5100_cast_fp16, var_5244_cast_fp16))[name = tensor("op_5270_cast_fp16")]; tensor var_5272_equation_0 = const()[name = tensor("op_5272_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5272_cast_fp16 = einsum(equation = var_5272_equation_0, values = (var_5104_cast_fp16, var_5245_cast_fp16))[name = tensor("op_5272_cast_fp16")]; tensor var_5274_equation_0 = const()[name = tensor("op_5274_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5274_cast_fp16 = einsum(equation = var_5274_equation_0, values = (var_5108_cast_fp16, var_5246_cast_fp16))[name = tensor("op_5274_cast_fp16")]; tensor var_5276_equation_0 = const()[name = tensor("op_5276_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5276_cast_fp16 = einsum(equation = var_5276_equation_0, values = (var_5112_cast_fp16, var_5247_cast_fp16))[name = tensor("op_5276_cast_fp16")]; tensor var_5278_equation_0 = const()[name = tensor("op_5278_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5278_cast_fp16 = einsum(equation = var_5278_equation_0, values = (var_5116_cast_fp16, var_5248_cast_fp16))[name = tensor("op_5278_cast_fp16")]; tensor var_5280_equation_0 = const()[name = tensor("op_5280_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5280_cast_fp16 = einsum(equation = var_5280_equation_0, values = (var_5120_cast_fp16, var_5249_cast_fp16))[name = tensor("op_5280_cast_fp16")]; tensor var_5282_equation_0 = const()[name = tensor("op_5282_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5282_cast_fp16 = einsum(equation = var_5282_equation_0, values = (var_5124_cast_fp16, var_5250_cast_fp16))[name = tensor("op_5282_cast_fp16")]; tensor var_5284_equation_0 = const()[name = tensor("op_5284_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5284_cast_fp16 = einsum(equation = var_5284_equation_0, values = (var_5128_cast_fp16, var_5251_cast_fp16))[name = tensor("op_5284_cast_fp16")]; tensor var_5286_equation_0 = const()[name = tensor("op_5286_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5286_cast_fp16 = einsum(equation = var_5286_equation_0, values = (var_5132_cast_fp16, var_5252_cast_fp16))[name = tensor("op_5286_cast_fp16")]; tensor var_5288_equation_0 = const()[name = tensor("op_5288_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5288_cast_fp16 = einsum(equation = var_5288_equation_0, values = (var_5136_cast_fp16, var_5253_cast_fp16))[name = tensor("op_5288_cast_fp16")]; tensor var_5290_equation_0 = const()[name = tensor("op_5290_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5290_cast_fp16 = einsum(equation = var_5290_equation_0, values = (var_5140_cast_fp16, var_5254_cast_fp16))[name = tensor("op_5290_cast_fp16")]; tensor var_5292_equation_0 = const()[name = tensor("op_5292_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5292_cast_fp16 = einsum(equation = var_5292_equation_0, values = (var_5144_cast_fp16, var_5255_cast_fp16))[name = tensor("op_5292_cast_fp16")]; tensor var_5294_equation_0 = const()[name = tensor("op_5294_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5294_cast_fp16 = einsum(equation = var_5294_equation_0, values = (var_5148_cast_fp16, var_5256_cast_fp16))[name = tensor("op_5294_cast_fp16")]; tensor var_5296_equation_0 = const()[name = tensor("op_5296_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5296_cast_fp16 = einsum(equation = var_5296_equation_0, values = (var_5152_cast_fp16, var_5257_cast_fp16))[name = tensor("op_5296_cast_fp16")]; tensor var_5298_equation_0 = const()[name = tensor("op_5298_equation_0"), val = tensor("bchk,bkhq->bchq")]; tensor var_5298_cast_fp16 = einsum(equation = var_5298_equation_0, values = (var_5156_cast_fp16, var_5258_cast_fp16))[name = tensor("op_5298_cast_fp16")]; tensor input_217_interleave_0 = const()[name = tensor("input_217_interleave_0"), val = tensor(false)]; tensor input_217_cast_fp16 = concat(axis = var_4371, interleave = input_217_interleave_0, values = (var_5260_cast_fp16, var_5262_cast_fp16, var_5264_cast_fp16, var_5266_cast_fp16, var_5268_cast_fp16, var_5270_cast_fp16, var_5272_cast_fp16, var_5274_cast_fp16, var_5276_cast_fp16, var_5278_cast_fp16, var_5280_cast_fp16, var_5282_cast_fp16, var_5284_cast_fp16, var_5286_cast_fp16, var_5288_cast_fp16, var_5290_cast_fp16, var_5292_cast_fp16, var_5294_cast_fp16, var_5296_cast_fp16, var_5298_cast_fp16))[name = tensor("input_217_cast_fp16")]; tensor var_5304 = const()[name = tensor("op_5304"), val = tensor([1, 1])]; tensor var_5306 = const()[name = tensor("op_5306"), val = tensor([1, 1])]; tensor var_5308_pad_type_0 = const()[name = tensor("op_5308_pad_type_0"), val = tensor("custom")]; tensor var_5308_pad_0 = const()[name = tensor("op_5308_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(595166144)))]; tensor mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(598443008)))]; tensor var_5308_cast_fp16 = conv(bias = mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_bias_to_fp16, dilations = var_5306, groups = var_4371, pad = var_5308_pad_0, pad_type = var_5308_pad_type_0, strides = var_5304, weight = mid_block_attentions_0_transformer_blocks_0_attn2_to_out_0_weight_to_fp16, x = input_217_cast_fp16)[name = tensor("op_5308_cast_fp16")]; tensor inputs_41_cast_fp16 = add(x = var_5308_cast_fp16, y = inputs_39_cast_fp16)[name = tensor("inputs_41_cast_fp16")]; tensor var_5312 = const()[name = tensor("op_5312"), val = tensor([1])]; tensor channels_mean_41_cast_fp16 = reduce_mean(axes = var_5312, keep_dims = var_4366, x = inputs_41_cast_fp16)[name = tensor("channels_mean_41_cast_fp16")]; tensor zero_mean_41_cast_fp16 = sub(x = inputs_41_cast_fp16, y = channels_mean_41_cast_fp16)[name = tensor("zero_mean_41_cast_fp16")]; tensor zero_mean_sq_41_cast_fp16 = mul(x = zero_mean_41_cast_fp16, y = zero_mean_41_cast_fp16)[name = tensor("zero_mean_sq_41_cast_fp16")]; tensor var_5316 = const()[name = tensor("op_5316"), val = tensor([1])]; tensor var_5317_cast_fp16 = reduce_mean(axes = var_5316, keep_dims = var_4366, x = zero_mean_sq_41_cast_fp16)[name = tensor("op_5317_cast_fp16")]; tensor var_5318_to_fp16 = const()[name = tensor("op_5318_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_5319_cast_fp16 = add(x = var_5317_cast_fp16, y = var_5318_to_fp16)[name = tensor("op_5319_cast_fp16")]; tensor denom_41_epsilon_0_to_fp16 = const()[name = tensor("denom_41_epsilon_0_to_fp16"), val = tensor(0x1p-24)]; tensor denom_41_cast_fp16 = rsqrt(epsilon = denom_41_epsilon_0_to_fp16, x = var_5319_cast_fp16)[name = tensor("denom_41_cast_fp16")]; tensor out_41_cast_fp16 = mul(x = zero_mean_41_cast_fp16, y = denom_41_cast_fp16)[name = tensor("out_41_cast_fp16")]; tensor var_5323_to_fp16 = const()[name = tensor("op_5323_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(598445632)))]; tensor var_5324_cast_fp16 = add(x = out_41_cast_fp16, y = var_5323_to_fp16)[name = tensor("op_5324_cast_fp16")]; tensor var_5326_to_fp16 = const()[name = tensor("op_5326_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(598448256)))]; tensor input_219_cast_fp16 = mul(x = var_5324_cast_fp16, y = var_5326_to_fp16)[name = tensor("input_219_cast_fp16")]; tensor var_5334 = const()[name = tensor("op_5334"), val = tensor([1, 1])]; tensor var_5336 = const()[name = tensor("op_5336"), val = tensor([1, 1])]; tensor var_5338_pad_type_0 = const()[name = tensor("op_5338_pad_type_0"), val = tensor("custom")]; tensor var_5338_pad_0 = const()[name = tensor("op_5338_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(598450880)))]; tensor mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(624665344)))]; tensor var_5338_cast_fp16 = conv(bias = mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_bias_to_fp16, dilations = var_5336, groups = var_4371, pad = var_5338_pad_0, pad_type = var_5338_pad_type_0, strides = var_5334, weight = mid_block_attentions_0_transformer_blocks_0_ff_net_0_proj_weight_to_fp16, x = input_219_cast_fp16)[name = tensor("op_5338_cast_fp16")]; tensor var_5339_split_sizes_0 = const()[name = tensor("op_5339_split_sizes_0"), val = tensor([5120, 5120])]; tensor var_5339_axis_0 = const()[name = tensor("op_5339_axis_0"), val = tensor(1)]; tensor var_5339_cast_fp16_0, tensor var_5339_cast_fp16_1 = split(axis = var_5339_axis_0, split_sizes = var_5339_split_sizes_0, x = var_5338_cast_fp16)[name = tensor("op_5339_cast_fp16")]; tensor var_5341_mode_0 = const()[name = tensor("op_5341_mode_0"), val = tensor("EXACT")]; tensor var_5341_cast_fp16 = gelu(mode = var_5341_mode_0, x = var_5339_cast_fp16_1)[name = tensor("op_5341_cast_fp16")]; tensor input_221_cast_fp16 = mul(x = var_5339_cast_fp16_0, y = var_5341_cast_fp16)[name = tensor("input_221_cast_fp16")]; tensor var_5345 = const()[name = tensor("op_5345"), val = tensor([1, 1])]; tensor var_5347 = const()[name = tensor("op_5347"), val = tensor([1, 1])]; tensor var_5349_pad_type_0 = const()[name = tensor("op_5349_pad_type_0"), val = tensor("custom")]; tensor var_5349_pad_0 = const()[name = tensor("op_5349_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(624685888)))]; tensor mid_block_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(637793152)))]; tensor var_5349_cast_fp16 = conv(bias = mid_block_attentions_0_transformer_blocks_0_ff_net_2_bias_to_fp16, dilations = var_5347, groups = var_4371, pad = var_5349_pad_0, pad_type = var_5349_pad_type_0, strides = var_5345, weight = mid_block_attentions_0_transformer_blocks_0_ff_net_2_weight_to_fp16, x = input_221_cast_fp16)[name = tensor("op_5349_cast_fp16")]; tensor hidden_states_131_cast_fp16 = add(x = var_5349_cast_fp16, y = inputs_41_cast_fp16)[name = tensor("hidden_states_131_cast_fp16")]; tensor var_5351 = const()[name = tensor("op_5351"), val = tensor([2, 1280, 6, 6])]; tensor input_223_cast_fp16 = reshape(shape = var_5351, x = hidden_states_131_cast_fp16)[name = tensor("input_223_cast_fp16")]; tensor var_5355 = const()[name = tensor("op_5355"), val = tensor([1, 1])]; tensor var_5357 = const()[name = tensor("op_5357"), val = tensor([1, 1])]; tensor hidden_states_133_pad_type_0 = const()[name = tensor("hidden_states_133_pad_type_0"), val = tensor("custom")]; tensor hidden_states_133_pad_0 = const()[name = tensor("hidden_states_133_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_attentions_0_proj_out_weight_to_fp16 = const()[name = tensor("mid_block_attentions_0_proj_out_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(637795776)))]; tensor mid_block_attentions_0_proj_out_bias_to_fp16 = const()[name = tensor("mid_block_attentions_0_proj_out_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641072640)))]; tensor hidden_states_133_cast_fp16 = conv(bias = mid_block_attentions_0_proj_out_bias_to_fp16, dilations = var_5357, groups = var_4371, pad = hidden_states_133_pad_0, pad_type = hidden_states_133_pad_type_0, strides = var_5355, weight = mid_block_attentions_0_proj_out_weight_to_fp16, x = input_223_cast_fp16)[name = tensor("hidden_states_133_cast_fp16")]; tensor input_225_cast_fp16 = add(x = hidden_states_133_cast_fp16, y = hidden_states_121_cast_fp16)[name = tensor("input_225_cast_fp16")]; tensor reshape_100_shape_0 = const()[name = tensor("reshape_100_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_100_cast_fp16 = reshape(shape = reshape_100_shape_0, x = input_225_cast_fp16)[name = tensor("reshape_100_cast_fp16")]; tensor reduce_mean_75_axes_0 = const()[name = tensor("reduce_mean_75_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_75_keep_dims_0 = const()[name = tensor("reduce_mean_75_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_75_cast_fp16 = reduce_mean(axes = reduce_mean_75_axes_0, keep_dims = reduce_mean_75_keep_dims_0, x = reshape_100_cast_fp16)[name = tensor("reduce_mean_75_cast_fp16")]; tensor sub_50_cast_fp16 = sub(x = reshape_100_cast_fp16, y = reduce_mean_75_cast_fp16)[name = tensor("sub_50_cast_fp16")]; tensor square_25_cast_fp16 = square(x = sub_50_cast_fp16)[name = tensor("square_25_cast_fp16")]; tensor reduce_mean_77_axes_0 = const()[name = tensor("reduce_mean_77_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_77_keep_dims_0 = const()[name = tensor("reduce_mean_77_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_77_cast_fp16 = reduce_mean(axes = reduce_mean_77_axes_0, keep_dims = reduce_mean_77_keep_dims_0, x = square_25_cast_fp16)[name = tensor("reduce_mean_77_cast_fp16")]; tensor add_50_y_0_to_fp16 = const()[name = tensor("add_50_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_50_cast_fp16 = add(x = reduce_mean_77_cast_fp16, y = add_50_y_0_to_fp16)[name = tensor("add_50_cast_fp16")]; tensor sqrt_25_cast_fp16 = sqrt(x = add_50_cast_fp16)[name = tensor("sqrt_25_cast_fp16")]; tensor real_div_25_cast_fp16 = real_div(x = sub_50_cast_fp16, y = sqrt_25_cast_fp16)[name = tensor("real_div_25_cast_fp16")]; tensor reshape_101_shape_0 = const()[name = tensor("reshape_101_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_101_cast_fp16 = reshape(shape = reshape_101_shape_0, x = real_div_25_cast_fp16)[name = tensor("reshape_101_cast_fp16")]; tensor add_51_gamma_0_to_fp16 = const()[name = tensor("add_51_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641075264)))]; tensor add_51_beta_0_to_fp16 = const()[name = tensor("add_51_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641077888)))]; tensor add_51_epsilon_0_to_fp16 = const()[name = tensor("add_51_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_51_cast_fp16 = batch_norm(beta = add_51_beta_0_to_fp16, epsilon = add_51_epsilon_0_to_fp16, gamma = add_51_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_101_cast_fp16)[name = tensor("add_51_cast_fp16")]; tensor input_229_cast_fp16 = silu(x = add_51_cast_fp16)[name = tensor("input_229_cast_fp16")]; tensor var_5372 = const()[name = tensor("op_5372"), val = tensor([1, 1])]; tensor var_5374 = const()[name = tensor("op_5374"), val = tensor([1, 1])]; tensor hidden_states_135_pad_type_0 = const()[name = tensor("hidden_states_135_pad_type_0"), val = tensor("custom")]; tensor hidden_states_135_pad_0 = const()[name = tensor("hidden_states_135_pad_0"), val = tensor([1, 1, 1, 1])]; tensor mid_block_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("mid_block_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(641080512)))]; tensor mid_block_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("mid_block_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(670571776)))]; tensor hidden_states_135_cast_fp16 = conv(bias = mid_block_resnets_1_conv1_bias_to_fp16, dilations = var_5374, groups = var_4371, pad = hidden_states_135_pad_0, pad_type = hidden_states_135_pad_type_0, strides = var_5372, weight = mid_block_resnets_1_conv1_weight_to_fp16, x = input_229_cast_fp16)[name = tensor("hidden_states_135_cast_fp16")]; tensor var_5380 = const()[name = tensor("op_5380"), val = tensor([1, 1])]; tensor var_5382 = const()[name = tensor("op_5382"), val = tensor([1, 1])]; tensor temb_19_pad_type_0 = const()[name = tensor("temb_19_pad_type_0"), val = tensor("custom")]; tensor temb_19_pad_0 = const()[name = tensor("temb_19_pad_0"), val = tensor([0, 0, 0, 0])]; tensor mid_block_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("mid_block_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(670574400)))]; tensor mid_block_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("mid_block_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673851264)))]; tensor temb_19_cast_fp16 = conv(bias = mid_block_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_5382, groups = var_4371, pad = temb_19_pad_0, pad_type = temb_19_pad_type_0, strides = var_5380, weight = mid_block_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_19_cast_fp16")]; tensor input_233_cast_fp16 = add(x = hidden_states_135_cast_fp16, y = temb_19_cast_fp16)[name = tensor("input_233_cast_fp16")]; tensor reshape_104_shape_0 = const()[name = tensor("reshape_104_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_104_cast_fp16 = reshape(shape = reshape_104_shape_0, x = input_233_cast_fp16)[name = tensor("reshape_104_cast_fp16")]; tensor reduce_mean_78_axes_0 = const()[name = tensor("reduce_mean_78_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_78_keep_dims_0 = const()[name = tensor("reduce_mean_78_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_78_cast_fp16 = reduce_mean(axes = reduce_mean_78_axes_0, keep_dims = reduce_mean_78_keep_dims_0, x = reshape_104_cast_fp16)[name = tensor("reduce_mean_78_cast_fp16")]; tensor sub_52_cast_fp16 = sub(x = reshape_104_cast_fp16, y = reduce_mean_78_cast_fp16)[name = tensor("sub_52_cast_fp16")]; tensor square_26_cast_fp16 = square(x = sub_52_cast_fp16)[name = tensor("square_26_cast_fp16")]; tensor reduce_mean_80_axes_0 = const()[name = tensor("reduce_mean_80_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_80_keep_dims_0 = const()[name = tensor("reduce_mean_80_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_80_cast_fp16 = reduce_mean(axes = reduce_mean_80_axes_0, keep_dims = reduce_mean_80_keep_dims_0, x = square_26_cast_fp16)[name = tensor("reduce_mean_80_cast_fp16")]; tensor add_52_y_0_to_fp16 = const()[name = tensor("add_52_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_52_cast_fp16 = add(x = reduce_mean_80_cast_fp16, y = add_52_y_0_to_fp16)[name = tensor("add_52_cast_fp16")]; tensor sqrt_26_cast_fp16 = sqrt(x = add_52_cast_fp16)[name = tensor("sqrt_26_cast_fp16")]; tensor real_div_26_cast_fp16 = real_div(x = sub_52_cast_fp16, y = sqrt_26_cast_fp16)[name = tensor("real_div_26_cast_fp16")]; tensor reshape_105_shape_0 = const()[name = tensor("reshape_105_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_105_cast_fp16 = reshape(shape = reshape_105_shape_0, x = real_div_26_cast_fp16)[name = tensor("reshape_105_cast_fp16")]; tensor add_53_gamma_0_to_fp16 = const()[name = tensor("add_53_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673853888)))]; tensor add_53_beta_0_to_fp16 = const()[name = tensor("add_53_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673856512)))]; tensor add_53_epsilon_0_to_fp16 = const()[name = tensor("add_53_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_53_cast_fp16 = batch_norm(beta = add_53_beta_0_to_fp16, epsilon = add_53_epsilon_0_to_fp16, gamma = add_53_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_105_cast_fp16)[name = tensor("add_53_cast_fp16")]; tensor input_237_cast_fp16 = silu(x = add_53_cast_fp16)[name = tensor("input_237_cast_fp16")]; tensor var_5392 = const()[name = tensor("op_5392"), val = tensor([1, 1])]; tensor var_5394 = const()[name = tensor("op_5394"), val = tensor([1, 1])]; tensor hidden_states_137_pad_type_0 = const()[name = tensor("hidden_states_137_pad_type_0"), val = tensor("custom")]; tensor hidden_states_137_pad_0 = const()[name = tensor("hidden_states_137_pad_0"), val = tensor([1, 1, 1, 1])]; tensor mid_block_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("mid_block_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(673859136)))]; tensor mid_block_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("mid_block_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703350400)))]; tensor hidden_states_137_cast_fp16 = conv(bias = mid_block_resnets_1_conv2_bias_to_fp16, dilations = var_5394, groups = var_4371, pad = hidden_states_137_pad_0, pad_type = hidden_states_137_pad_type_0, strides = var_5392, weight = mid_block_resnets_1_conv2_weight_to_fp16, x = input_237_cast_fp16)[name = tensor("hidden_states_137_cast_fp16")]; tensor hidden_states_139_cast_fp16 = add(x = input_225_cast_fp16, y = hidden_states_137_cast_fp16)[name = tensor("hidden_states_139_cast_fp16")]; tensor var_5405 = const()[name = tensor("op_5405"), val = tensor(1)]; tensor input_239_interleave_0 = const()[name = tensor("input_239_interleave_0"), val = tensor(false)]; tensor input_239_cast_fp16 = concat(axis = var_5405, interleave = input_239_interleave_0, values = (hidden_states_139_cast_fp16, input_199_cast_fp16))[name = tensor("input_239_cast_fp16")]; tensor reshape_108_shape_0 = const()[name = tensor("reshape_108_shape_0"), val = tensor([2, 32, 80, 6, 6])]; tensor reshape_108_cast_fp16 = reshape(shape = reshape_108_shape_0, x = input_239_cast_fp16)[name = tensor("reshape_108_cast_fp16")]; tensor reduce_mean_81_axes_0 = const()[name = tensor("reduce_mean_81_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_81_keep_dims_0 = const()[name = tensor("reduce_mean_81_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_81_cast_fp16 = reduce_mean(axes = reduce_mean_81_axes_0, keep_dims = reduce_mean_81_keep_dims_0, x = reshape_108_cast_fp16)[name = tensor("reduce_mean_81_cast_fp16")]; tensor sub_54_cast_fp16 = sub(x = reshape_108_cast_fp16, y = reduce_mean_81_cast_fp16)[name = tensor("sub_54_cast_fp16")]; tensor square_27_cast_fp16 = square(x = sub_54_cast_fp16)[name = tensor("square_27_cast_fp16")]; tensor reduce_mean_83_axes_0 = const()[name = tensor("reduce_mean_83_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_83_keep_dims_0 = const()[name = tensor("reduce_mean_83_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_83_cast_fp16 = reduce_mean(axes = reduce_mean_83_axes_0, keep_dims = reduce_mean_83_keep_dims_0, x = square_27_cast_fp16)[name = tensor("reduce_mean_83_cast_fp16")]; tensor add_54_y_0_to_fp16 = const()[name = tensor("add_54_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_54_cast_fp16 = add(x = reduce_mean_83_cast_fp16, y = add_54_y_0_to_fp16)[name = tensor("add_54_cast_fp16")]; tensor sqrt_27_cast_fp16 = sqrt(x = add_54_cast_fp16)[name = tensor("sqrt_27_cast_fp16")]; tensor real_div_27_cast_fp16 = real_div(x = sub_54_cast_fp16, y = sqrt_27_cast_fp16)[name = tensor("real_div_27_cast_fp16")]; tensor reshape_109_shape_0 = const()[name = tensor("reshape_109_shape_0"), val = tensor([2, 2560, 6, 6])]; tensor reshape_109_cast_fp16 = reshape(shape = reshape_109_shape_0, x = real_div_27_cast_fp16)[name = tensor("reshape_109_cast_fp16")]; tensor add_55_mean_0_to_fp16 = const()[name = tensor("add_55_mean_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703353024)))]; tensor add_55_variance_0_to_fp16 = const()[name = tensor("add_55_variance_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703358208)))]; tensor add_55_gamma_0_to_fp16 = const()[name = tensor("add_55_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703363392)))]; tensor add_55_beta_0_to_fp16 = const()[name = tensor("add_55_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703368576)))]; tensor add_55_epsilon_0_to_fp16 = const()[name = tensor("add_55_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_55_cast_fp16 = batch_norm(beta = add_55_beta_0_to_fp16, epsilon = add_55_epsilon_0_to_fp16, gamma = add_55_gamma_0_to_fp16, mean = add_55_mean_0_to_fp16, variance = add_55_variance_0_to_fp16, x = reshape_109_cast_fp16)[name = tensor("add_55_cast_fp16")]; tensor input_243_cast_fp16 = silu(x = add_55_cast_fp16)[name = tensor("input_243_cast_fp16")]; tensor var_5428 = const()[name = tensor("op_5428"), val = tensor([1, 1])]; tensor var_5430 = const()[name = tensor("op_5430"), val = tensor([1, 1])]; tensor hidden_states_141_pad_type_0 = const()[name = tensor("hidden_states_141_pad_type_0"), val = tensor("custom")]; tensor hidden_states_141_pad_0 = const()[name = tensor("hidden_states_141_pad_0"), val = tensor([1, 1, 1, 1])]; tensor up_blocks_0_resnets_0_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(703373760)))]; tensor up_blocks_0_resnets_0_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762356224)))]; tensor hidden_states_141_cast_fp16 = conv(bias = up_blocks_0_resnets_0_conv1_bias_to_fp16, dilations = var_5430, groups = var_5405, pad = hidden_states_141_pad_0, pad_type = hidden_states_141_pad_type_0, strides = var_5428, weight = up_blocks_0_resnets_0_conv1_weight_to_fp16, x = input_243_cast_fp16)[name = tensor("hidden_states_141_cast_fp16")]; tensor var_5436 = const()[name = tensor("op_5436"), val = tensor([1, 1])]; tensor var_5438 = const()[name = tensor("op_5438"), val = tensor([1, 1])]; tensor temb_21_pad_type_0 = const()[name = tensor("temb_21_pad_type_0"), val = tensor("custom")]; tensor temb_21_pad_0 = const()[name = tensor("temb_21_pad_0"), val = tensor([0, 0, 0, 0])]; tensor up_blocks_0_resnets_0_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(762358848)))]; tensor up_blocks_0_resnets_0_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765635712)))]; tensor temb_21_cast_fp16 = conv(bias = up_blocks_0_resnets_0_time_emb_proj_bias_to_fp16, dilations = var_5438, groups = var_5405, pad = temb_21_pad_0, pad_type = temb_21_pad_type_0, strides = var_5436, weight = up_blocks_0_resnets_0_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_21_cast_fp16")]; tensor input_247_cast_fp16 = add(x = hidden_states_141_cast_fp16, y = temb_21_cast_fp16)[name = tensor("input_247_cast_fp16")]; tensor reshape_112_shape_0 = const()[name = tensor("reshape_112_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_112_cast_fp16 = reshape(shape = reshape_112_shape_0, x = input_247_cast_fp16)[name = tensor("reshape_112_cast_fp16")]; tensor reduce_mean_84_axes_0 = const()[name = tensor("reduce_mean_84_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_84_keep_dims_0 = const()[name = tensor("reduce_mean_84_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_84_cast_fp16 = reduce_mean(axes = reduce_mean_84_axes_0, keep_dims = reduce_mean_84_keep_dims_0, x = reshape_112_cast_fp16)[name = tensor("reduce_mean_84_cast_fp16")]; tensor sub_56_cast_fp16 = sub(x = reshape_112_cast_fp16, y = reduce_mean_84_cast_fp16)[name = tensor("sub_56_cast_fp16")]; tensor square_28_cast_fp16 = square(x = sub_56_cast_fp16)[name = tensor("square_28_cast_fp16")]; tensor reduce_mean_86_axes_0 = const()[name = tensor("reduce_mean_86_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_86_keep_dims_0 = const()[name = tensor("reduce_mean_86_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_86_cast_fp16 = reduce_mean(axes = reduce_mean_86_axes_0, keep_dims = reduce_mean_86_keep_dims_0, x = square_28_cast_fp16)[name = tensor("reduce_mean_86_cast_fp16")]; tensor add_56_y_0_to_fp16 = const()[name = tensor("add_56_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_56_cast_fp16 = add(x = reduce_mean_86_cast_fp16, y = add_56_y_0_to_fp16)[name = tensor("add_56_cast_fp16")]; tensor sqrt_28_cast_fp16 = sqrt(x = add_56_cast_fp16)[name = tensor("sqrt_28_cast_fp16")]; tensor real_div_28_cast_fp16 = real_div(x = sub_56_cast_fp16, y = sqrt_28_cast_fp16)[name = tensor("real_div_28_cast_fp16")]; tensor reshape_113_shape_0 = const()[name = tensor("reshape_113_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_113_cast_fp16 = reshape(shape = reshape_113_shape_0, x = real_div_28_cast_fp16)[name = tensor("reshape_113_cast_fp16")]; tensor add_57_gamma_0_to_fp16 = const()[name = tensor("add_57_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765638336)))]; tensor add_57_beta_0_to_fp16 = const()[name = tensor("add_57_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765640960)))]; tensor add_57_epsilon_0_to_fp16 = const()[name = tensor("add_57_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_57_cast_fp16 = batch_norm(beta = add_57_beta_0_to_fp16, epsilon = add_57_epsilon_0_to_fp16, gamma = add_57_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_113_cast_fp16)[name = tensor("add_57_cast_fp16")]; tensor input_251_cast_fp16 = silu(x = add_57_cast_fp16)[name = tensor("input_251_cast_fp16")]; tensor var_5448 = const()[name = tensor("op_5448"), val = tensor([1, 1])]; tensor var_5450 = const()[name = tensor("op_5450"), val = tensor([1, 1])]; tensor hidden_states_143_pad_type_0 = const()[name = tensor("hidden_states_143_pad_type_0"), val = tensor("custom")]; tensor hidden_states_143_pad_0 = const()[name = tensor("hidden_states_143_pad_0"), val = tensor([1, 1, 1, 1])]; tensor up_blocks_0_resnets_0_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(765643584)))]; tensor up_blocks_0_resnets_0_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795134848)))]; tensor hidden_states_143_cast_fp16 = conv(bias = up_blocks_0_resnets_0_conv2_bias_to_fp16, dilations = var_5450, groups = var_5405, pad = hidden_states_143_pad_0, pad_type = hidden_states_143_pad_type_0, strides = var_5448, weight = up_blocks_0_resnets_0_conv2_weight_to_fp16, x = input_251_cast_fp16)[name = tensor("hidden_states_143_cast_fp16")]; tensor var_5455 = const()[name = tensor("op_5455"), val = tensor([1, 1])]; tensor var_5457 = const()[name = tensor("op_5457"), val = tensor([1, 1])]; tensor x_5_pad_type_0 = const()[name = tensor("x_5_pad_type_0"), val = tensor("custom")]; tensor x_5_pad_0 = const()[name = tensor("x_5_pad_0"), val = tensor([0, 0, 0, 0])]; tensor up_blocks_0_resnets_0_conv_shortcut_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv_shortcut_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(795137472)))]; tensor up_blocks_0_resnets_0_conv_shortcut_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_0_conv_shortcut_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801691136)))]; tensor x_5_cast_fp16 = conv(bias = up_blocks_0_resnets_0_conv_shortcut_bias_to_fp16, dilations = var_5457, groups = var_5405, pad = x_5_pad_0, pad_type = x_5_pad_type_0, strides = var_5455, weight = up_blocks_0_resnets_0_conv_shortcut_weight_to_fp16, x = input_239_cast_fp16)[name = tensor("x_5_cast_fp16")]; tensor hidden_states_145_cast_fp16 = add(x = x_5_cast_fp16, y = hidden_states_143_cast_fp16)[name = tensor("hidden_states_145_cast_fp16")]; tensor input_253_interleave_0 = const()[name = tensor("input_253_interleave_0"), val = tensor(false)]; tensor input_253_cast_fp16_1 = concat(axis = var_5405, interleave = input_253_interleave_0, values = (hidden_states_145_cast_fp16, input_185_cast_fp16))[name = tensor("input_253_cast_fp16")]; tensor reshape_116_shape_0 = const()[name = tensor("reshape_116_shape_0"), val = tensor([2, 32, 80, 6, 6])]; tensor reshape_116_cast_fp16 = reshape(shape = reshape_116_shape_0, x = input_253_cast_fp16_1)[name = tensor("reshape_116_cast_fp16")]; tensor reduce_mean_87_axes_0 = const()[name = tensor("reduce_mean_87_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_87_keep_dims_0 = const()[name = tensor("reduce_mean_87_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_87_cast_fp16 = reduce_mean(axes = reduce_mean_87_axes_0, keep_dims = reduce_mean_87_keep_dims_0, x = reshape_116_cast_fp16)[name = tensor("reduce_mean_87_cast_fp16")]; tensor sub_58_cast_fp16 = sub(x = reshape_116_cast_fp16, y = reduce_mean_87_cast_fp16)[name = tensor("sub_58_cast_fp16")]; tensor square_29_cast_fp16 = square(x = sub_58_cast_fp16)[name = tensor("square_29_cast_fp16")]; tensor reduce_mean_89_axes_0 = const()[name = tensor("reduce_mean_89_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_89_keep_dims_0 = const()[name = tensor("reduce_mean_89_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_89_cast_fp16 = reduce_mean(axes = reduce_mean_89_axes_0, keep_dims = reduce_mean_89_keep_dims_0, x = square_29_cast_fp16)[name = tensor("reduce_mean_89_cast_fp16")]; tensor add_58_y_0_to_fp16 = const()[name = tensor("add_58_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_58_cast_fp16 = add(x = reduce_mean_89_cast_fp16, y = add_58_y_0_to_fp16)[name = tensor("add_58_cast_fp16")]; tensor sqrt_29_cast_fp16 = sqrt(x = add_58_cast_fp16)[name = tensor("sqrt_29_cast_fp16")]; tensor real_div_29_cast_fp16 = real_div(x = sub_58_cast_fp16, y = sqrt_29_cast_fp16)[name = tensor("real_div_29_cast_fp16")]; tensor reshape_117_shape_0 = const()[name = tensor("reshape_117_shape_0"), val = tensor([2, 2560, 6, 6])]; tensor reshape_117_cast_fp16 = reshape(shape = reshape_117_shape_0, x = real_div_29_cast_fp16)[name = tensor("reshape_117_cast_fp16")]; tensor add_59_gamma_0_to_fp16 = const()[name = tensor("add_59_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801693760)))]; tensor add_59_beta_0_to_fp16 = const()[name = tensor("add_59_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801698944)))]; tensor add_59_epsilon_0_to_fp16 = const()[name = tensor("add_59_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_59_cast_fp16 = batch_norm(beta = add_59_beta_0_to_fp16, epsilon = add_59_epsilon_0_to_fp16, gamma = add_59_gamma_0_to_fp16, mean = add_55_mean_0_to_fp16, variance = add_55_variance_0_to_fp16, x = reshape_117_cast_fp16)[name = tensor("add_59_cast_fp16")]; tensor input_257_cast_fp16 = silu(x = add_59_cast_fp16)[name = tensor("input_257_cast_fp16")]; tensor var_5475 = const()[name = tensor("op_5475"), val = tensor([1, 1])]; tensor var_5477 = const()[name = tensor("op_5477"), val = tensor([1, 1])]; tensor hidden_states_147_pad_type_0 = const()[name = tensor("hidden_states_147_pad_type_0"), val = tensor("custom")]; tensor hidden_states_147_pad_0 = const()[name = tensor("hidden_states_147_pad_0"), val = tensor([1, 1, 1, 1])]; tensor up_blocks_0_resnets_1_conv1_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv1_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(801704128)))]; tensor up_blocks_0_resnets_1_conv1_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv1_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(860686592)))]; tensor hidden_states_147_cast_fp16 = conv(bias = up_blocks_0_resnets_1_conv1_bias_to_fp16, dilations = var_5477, groups = var_5405, pad = hidden_states_147_pad_0, pad_type = hidden_states_147_pad_type_0, strides = var_5475, weight = up_blocks_0_resnets_1_conv1_weight_to_fp16, x = input_257_cast_fp16)[name = tensor("hidden_states_147_cast_fp16")]; tensor var_5483 = const()[name = tensor("op_5483"), val = tensor([1, 1])]; tensor var_5485 = const()[name = tensor("op_5485"), val = tensor([1, 1])]; tensor temb_23_pad_type_0 = const()[name = tensor("temb_23_pad_type_0"), val = tensor("custom")]; tensor temb_23_pad_0 = const()[name = tensor("temb_23_pad_0"), val = tensor([0, 0, 0, 0])]; tensor up_blocks_0_resnets_1_time_emb_proj_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_time_emb_proj_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(860689216)))]; tensor up_blocks_0_resnets_1_time_emb_proj_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_time_emb_proj_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(863966080)))]; tensor temb_23_cast_fp16 = conv(bias = up_blocks_0_resnets_1_time_emb_proj_bias_to_fp16, dilations = var_5485, groups = var_5405, pad = temb_23_pad_0, pad_type = temb_23_pad_type_0, strides = var_5483, weight = up_blocks_0_resnets_1_time_emb_proj_weight_to_fp16, x = input_15_cast_fp16_1)[name = tensor("temb_23_cast_fp16")]; tensor input_261_cast_fp16 = add(x = hidden_states_147_cast_fp16, y = temb_23_cast_fp16)[name = tensor("input_261_cast_fp16")]; tensor reshape_120_shape_0 = const()[name = tensor("reshape_120_shape_0"), val = tensor([2, 32, 40, 6, 6])]; tensor reshape_120_cast_fp16 = reshape(shape = reshape_120_shape_0, x = input_261_cast_fp16)[name = tensor("reshape_120_cast_fp16")]; tensor reduce_mean_90_axes_0 = const()[name = tensor("reduce_mean_90_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_90_keep_dims_0 = const()[name = tensor("reduce_mean_90_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_90_cast_fp16 = reduce_mean(axes = reduce_mean_90_axes_0, keep_dims = reduce_mean_90_keep_dims_0, x = reshape_120_cast_fp16)[name = tensor("reduce_mean_90_cast_fp16")]; tensor sub_60_cast_fp16 = sub(x = reshape_120_cast_fp16, y = reduce_mean_90_cast_fp16)[name = tensor("sub_60_cast_fp16")]; tensor square_30_cast_fp16 = square(x = sub_60_cast_fp16)[name = tensor("square_30_cast_fp16")]; tensor reduce_mean_92_axes_0 = const()[name = tensor("reduce_mean_92_axes_0"), val = tensor([2, 3, 4])]; tensor reduce_mean_92_keep_dims_0 = const()[name = tensor("reduce_mean_92_keep_dims_0"), val = tensor(true)]; tensor reduce_mean_92_cast_fp16 = reduce_mean(axes = reduce_mean_92_axes_0, keep_dims = reduce_mean_92_keep_dims_0, x = square_30_cast_fp16)[name = tensor("reduce_mean_92_cast_fp16")]; tensor add_60_y_0_to_fp16 = const()[name = tensor("add_60_y_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_60_cast_fp16 = add(x = reduce_mean_92_cast_fp16, y = add_60_y_0_to_fp16)[name = tensor("add_60_cast_fp16")]; tensor sqrt_30_cast_fp16 = sqrt(x = add_60_cast_fp16)[name = tensor("sqrt_30_cast_fp16")]; tensor real_div_30_cast_fp16 = real_div(x = sub_60_cast_fp16, y = sqrt_30_cast_fp16)[name = tensor("real_div_30_cast_fp16")]; tensor reshape_121_shape_0 = const()[name = tensor("reshape_121_shape_0"), val = tensor([2, 1280, 6, 6])]; tensor reshape_121_cast_fp16 = reshape(shape = reshape_121_shape_0, x = real_div_30_cast_fp16)[name = tensor("reshape_121_cast_fp16")]; tensor add_61_gamma_0_to_fp16 = const()[name = tensor("add_61_gamma_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(863968704)))]; tensor add_61_beta_0_to_fp16 = const()[name = tensor("add_61_beta_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(863971328)))]; tensor add_61_epsilon_0_to_fp16 = const()[name = tensor("add_61_epsilon_0_to_fp16"), val = tensor(0x1.5p-17)]; tensor add_61_cast_fp16 = batch_norm(beta = add_61_beta_0_to_fp16, epsilon = add_61_epsilon_0_to_fp16, gamma = add_61_gamma_0_to_fp16, mean = add_27_mean_0_to_fp16, variance = add_27_variance_0_to_fp16, x = reshape_121_cast_fp16)[name = tensor("add_61_cast_fp16")]; tensor input_265_cast_fp16 = silu(x = add_61_cast_fp16)[name = tensor("input_265_cast_fp16")]; tensor var_5495 = const()[name = tensor("op_5495"), val = tensor([1, 1])]; tensor var_5497 = const()[name = tensor("op_5497"), val = tensor([1, 1])]; tensor hidden_states_149_pad_type_0 = const()[name = tensor("hidden_states_149_pad_type_0"), val = tensor("custom")]; tensor hidden_states_149_pad_0 = const()[name = tensor("hidden_states_149_pad_0"), val = tensor([1, 1, 1, 1])]; tensor up_blocks_0_resnets_1_conv2_weight_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv2_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(863973952)))]; tensor up_blocks_0_resnets_1_conv2_bias_to_fp16 = const()[name = tensor("up_blocks_0_resnets_1_conv2_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(893465216)))]; tensor hidden_states_149_cast_fp16_1 = conv(bias = up_blocks_0_resnets_1_conv2_bias_to_fp16, dilations = var_5497, groups = var_5405, pad = hidden_states_149_pad_0, pad_type = hidden_states_149_pad_type_0, strides = var_5495, weight = up_blocks_0_resnets_1_conv2_weight_to_fp16, x = input_265_cast_fp16)[name = tensor("hidden_states_149_cast_fp16")]; tensor input_117_cast_fp16_dtype_0 = const()[name = tensor("input_117_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_7_cast_fp16_dtype_0 = const()[name = tensor("input_7_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_115_cast_fp16_dtype_0 = const()[name = tensor("input_115_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_89_cast_fp16_dtype_0 = const()[name = tensor("input_89_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_171_cast_fp16_dtype_0 = const()[name = tensor("input_171_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_15_cast_fp16_dtype_0 = const()[name = tensor("input_15_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_253_cast_fp16_dtype_0 = const()[name = tensor("input_253_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor hidden_states_149_cast_fp16_dtype_0 = const()[name = tensor("hidden_states_149_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_35_cast_fp16_dtype_0 = const()[name = tensor("input_35_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_143_cast_fp16_dtype_0 = const()[name = tensor("input_143_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_169_cast_fp16_dtype_0 = const()[name = tensor("input_169_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_63_cast_fp16_dtype_0 = const()[name = tensor("input_63_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_61_cast_fp16_dtype_0 = const()[name = tensor("input_61_cast_fp16_dtype_0"), val = tensor("fp32")]; tensor input_61_cast_fp16 = cast(dtype = input_61_cast_fp16_dtype_0, x = input_61_cast_fp16_1)[name = tensor("cast_13")]; tensor input_63_cast_fp16 = cast(dtype = input_63_cast_fp16_dtype_0, x = input_63_cast_fp16_1)[name = tensor("cast_14")]; tensor input_169_cast_fp16 = cast(dtype = input_169_cast_fp16_dtype_0, x = input_169_cast_fp16_1)[name = tensor("cast_15")]; tensor input_143_cast_fp16 = cast(dtype = input_143_cast_fp16_dtype_0, x = input_143_cast_fp16_1)[name = tensor("cast_16")]; tensor input_35_cast_fp16 = cast(dtype = input_35_cast_fp16_dtype_0, x = input_35_cast_fp16_1)[name = tensor("cast_17")]; tensor hidden_states_149_cast_fp16 = cast(dtype = hidden_states_149_cast_fp16_dtype_0, x = hidden_states_149_cast_fp16_1)[name = tensor("cast_18")]; tensor input_253_cast_fp16 = cast(dtype = input_253_cast_fp16_dtype_0, x = input_253_cast_fp16_1)[name = tensor("cast_19")]; tensor input_15_cast_fp16 = cast(dtype = input_15_cast_fp16_dtype_0, x = input_15_cast_fp16_1)[name = tensor("cast_20")]; tensor input_171_cast_fp16 = cast(dtype = input_171_cast_fp16_dtype_0, x = input_171_cast_fp16_1)[name = tensor("cast_21")]; tensor input_89_cast_fp16 = cast(dtype = input_89_cast_fp16_dtype_0, x = input_89_cast_fp16_1)[name = tensor("cast_22")]; tensor input_115_cast_fp16 = cast(dtype = input_115_cast_fp16_dtype_0, x = input_115_cast_fp16_1)[name = tensor("cast_23")]; tensor input_7_cast_fp16 = cast(dtype = input_7_cast_fp16_dtype_0, x = input_7_cast_fp16_1)[name = tensor("cast_24")]; tensor input_117_cast_fp16 = cast(dtype = input_117_cast_fp16_dtype_0, x = input_117_cast_fp16_1)[name = tensor("cast_25")]; } -> (input_117_cast_fp16, input_7_cast_fp16, input_115_cast_fp16, input_89_cast_fp16, input_171_cast_fp16, input_15_cast_fp16, input_253_cast_fp16, hidden_states_149_cast_fp16, input_35_cast_fp16, input_143_cast_fp16, input_169_cast_fp16, input_63_cast_fp16, input_61_cast_fp16); }