program(1.0)
[buildInfo = dict<tensor<string, []>, tensor<string, []>>({{"coremlc-component-MIL", "5.33.5"}, {"coremlc-version", "1877.40.3"}, {"coremltools-component-torch", "2.2.1"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "7.1"}})]
{
    func main<ios16>(tensor<fp16, [1, 80, 1, 3000]> melspectrogram_features) {
            tensor<int32, [2]> var_38 = const()[name = tensor<string, []>("op_38"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_44 = const()[name = tensor<string, []>("op_44"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, []> var_49 = const()[name = tensor<string, []>("op_49"), val = tensor<int32, []>(1)];
            tensor<string, []> var_54_pad_type_0 = const()[name = tensor<string, []>("op_54_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_54_pad_0 = const()[name = tensor<string, []>("op_54_pad_0"), val = tensor<int32, [4]>([0, 0, 1, 1])];
            tensor<fp16, [512, 80, 1, 3]> var_29_to_fp16 = const()[name = tensor<string, []>("op_29_to_fp16"), val = tensor<fp16, [512, 80, 1, 3]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(64)))];
            tensor<fp16, [512]> var_35_to_fp16 = const()[name = tensor<string, []>("op_35_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(245888)))];
            tensor<fp16, [1, 512, 1, 3000]> var_54_cast_fp16 = conv(bias = var_35_to_fp16, dilations = var_44, groups = var_49, pad = var_54_pad_0, pad_type = var_54_pad_type_0, strides = var_38, weight = var_29_to_fp16, x = melspectrogram_features)[name = tensor<string, []>("op_54_cast_fp16")];
            tensor<string, []> hidden_states_1_mode_0 = const()[name = tensor<string, []>("hidden_states_1_mode_0"), val = tensor<string, []>("EXACT")];
            tensor<fp16, [1, 512, 1, 3000]> hidden_states_1_cast_fp16 = gelu(mode = hidden_states_1_mode_0, x = var_54_cast_fp16)[name = tensor<string, []>("hidden_states_1_cast_fp16")];
            tensor<int32, [2]> var_78 = const()[name = tensor<string, []>("op_78"), val = tensor<int32, [2]>([2, 2])];
            tensor<int32, [2]> var_84 = const()[name = tensor<string, []>("op_84"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, []> var_89 = const()[name = tensor<string, []>("op_89"), val = tensor<int32, []>(1)];
            tensor<string, []> var_94_pad_type_0 = const()[name = tensor<string, []>("op_94_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> var_94_pad_0 = const()[name = tensor<string, []>("op_94_pad_0"), val = tensor<int32, [4]>([0, 0, 1, 1])];
            tensor<fp16, [512, 512, 1, 3]> var_69_to_fp16 = const()[name = tensor<string, []>("op_69_to_fp16"), val = tensor<fp16, [512, 512, 1, 3]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(246976)))];
            tensor<fp16, [512]> var_75_to_fp16 = const()[name = tensor<string, []>("op_75_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1819904)))];
            tensor<fp16, [1, 512, 1, 1500]> var_94_cast_fp16 = conv(bias = var_75_to_fp16, dilations = var_84, groups = var_89, pad = var_94_pad_0, pad_type = var_94_pad_type_0, strides = var_78, weight = var_69_to_fp16, x = hidden_states_1_cast_fp16)[name = tensor<string, []>("op_94_cast_fp16")];
            tensor<string, []> hidden_states_3_mode_0 = const()[name = tensor<string, []>("hidden_states_3_mode_0"), val = tensor<string, []>("EXACT")];
            tensor<fp16, [1, 512, 1, 1500]> hidden_states_3_cast_fp16 = gelu(mode = hidden_states_3_mode_0, x = var_94_cast_fp16)[name = tensor<string, []>("hidden_states_3_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> var_112_to_fp16 = const()[name = tensor<string, []>("op_112_to_fp16"), val = tensor<fp16, [1, 512, 1, 1500]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(1820992)))];
            tensor<fp16, [1, 512, 1, 1500]> inputs_1_cast_fp16 = add(x = hidden_states_3_cast_fp16, y = var_112_to_fp16)[name = tensor<string, []>("inputs_1_cast_fp16")];
            tensor<int32, []> var_122 = const()[name = tensor<string, []>("op_122"), val = tensor<int32, []>(3)];
            tensor<int32, []> var_135 = const()[name = tensor<string, []>("op_135"), val = tensor<int32, []>(1)];
            tensor<bool, []> var_136 = const()[name = tensor<string, []>("op_136"), val = tensor<bool, []>(true)];
            tensor<int32, [1]> var_146 = const()[name = tensor<string, []>("op_146"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_1_cast_fp16 = reduce_mean(axes = var_146, keep_dims = var_136, x = inputs_1_cast_fp16)[name = tensor<string, []>("channels_mean_1_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_1_cast_fp16 = sub(x = inputs_1_cast_fp16, y = channels_mean_1_cast_fp16)[name = tensor<string, []>("zero_mean_1_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_1_cast_fp16 = mul(x = zero_mean_1_cast_fp16, y = zero_mean_1_cast_fp16)[name = tensor<string, []>("zero_mean_sq_1_cast_fp16")];
            tensor<int32, [1]> var_150 = const()[name = tensor<string, []>("op_150"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_151_cast_fp16 = reduce_mean(axes = var_150, keep_dims = var_136, x = zero_mean_sq_1_cast_fp16)[name = tensor<string, []>("op_151_cast_fp16")];
            tensor<fp16, []> var_152_to_fp16 = const()[name = tensor<string, []>("op_152_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_153_cast_fp16 = add(x = var_151_cast_fp16, y = var_152_to_fp16)[name = tensor<string, []>("op_153_cast_fp16")];
            tensor<fp16, []> denom_1_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_1_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_1_cast_fp16 = rsqrt(epsilon = denom_1_epsilon_0_to_fp16, x = var_153_cast_fp16)[name = tensor<string, []>("denom_1_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_1_cast_fp16 = mul(x = zero_mean_1_cast_fp16, y = denom_1_cast_fp16)[name = tensor<string, []>("out_1_cast_fp16")];
            tensor<fp16, [512]> obj_1_mean_0_to_fp16 = const()[name = tensor<string, []>("obj_1_mean_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3357056)))];
            tensor<fp16, [512]> obj_1_variance_0_to_fp16 = const()[name = tensor<string, []>("obj_1_variance_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3358144)))];
            tensor<fp16, [512]> obj_1_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_1_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3359232)))];
            tensor<fp16, [512]> obj_1_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_1_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3360320)))];
            tensor<fp16, []> obj_1_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_1_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> obj_1_cast_fp16 = batch_norm(beta = obj_1_beta_0_to_fp16, epsilon = obj_1_epsilon_0_to_fp16, gamma = obj_1_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_1_cast_fp16)[name = tensor<string, []>("obj_1_cast_fp16")];
            tensor<int32, [2]> var_168 = const()[name = tensor<string, []>("op_168"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_170 = const()[name = tensor<string, []>("op_170"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_1_pad_type_0 = const()[name = tensor<string, []>("query_1_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_1_pad_0 = const()[name = tensor<string, []>("query_1_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_0_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3361408)))];
            tensor<fp16, [512]> layers_0_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3885760)))];
            tensor<fp16, [1, 512, 1, 1500]> query_1_cast_fp16 = conv(bias = layers_0_self_attn_q_proj_bias_to_fp16, dilations = var_170, groups = var_135, pad = query_1_pad_0, pad_type = query_1_pad_type_0, strides = var_168, weight = layers_0_self_attn_q_proj_weight_to_fp16, x = obj_1_cast_fp16)[name = tensor<string, []>("query_1_cast_fp16")];
            tensor<int32, [2]> var_174 = const()[name = tensor<string, []>("op_174"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_176 = const()[name = tensor<string, []>("op_176"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_1_pad_type_0 = const()[name = tensor<string, []>("key_1_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_1_pad_0 = const()[name = tensor<string, []>("key_1_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_0_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(3886848)))];
            tensor<fp16, [1, 512, 1, 1500]> key_1_cast_fp16 = conv(dilations = var_176, groups = var_135, pad = key_1_pad_0, pad_type = key_1_pad_type_0, strides = var_174, weight = layers_0_self_attn_k_proj_weight_to_fp16, x = obj_1_cast_fp16)[name = tensor<string, []>("key_1_cast_fp16")];
            tensor<int32, [2]> var_181 = const()[name = tensor<string, []>("op_181"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_183 = const()[name = tensor<string, []>("op_183"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_1_pad_type_0 = const()[name = tensor<string, []>("value_1_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_1_pad_0 = const()[name = tensor<string, []>("value_1_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_0_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4411200)))];
            tensor<fp16, [512]> layers_0_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4935552)))];
            tensor<fp16, [1, 512, 1, 1500]> value_1_cast_fp16 = conv(bias = layers_0_self_attn_v_proj_bias_to_fp16, dilations = var_183, groups = var_135, pad = value_1_pad_0, pad_type = value_1_pad_type_0, strides = var_181, weight = layers_0_self_attn_v_proj_weight_to_fp16, x = obj_1_cast_fp16)[name = tensor<string, []>("value_1_cast_fp16")];
            tensor<int32, [4]> var_190_begin_0 = const()[name = tensor<string, []>("op_190_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_190_end_0 = const()[name = tensor<string, []>("op_190_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_190_end_mask_0 = const()[name = tensor<string, []>("op_190_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_190_cast_fp16 = slice_by_index(begin = var_190_begin_0, end = var_190_end_0, end_mask = var_190_end_mask_0, x = query_1_cast_fp16)[name = tensor<string, []>("op_190_cast_fp16")];
            tensor<int32, [4]> var_194_begin_0 = const()[name = tensor<string, []>("op_194_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_194_end_0 = const()[name = tensor<string, []>("op_194_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_194_end_mask_0 = const()[name = tensor<string, []>("op_194_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_194_cast_fp16 = slice_by_index(begin = var_194_begin_0, end = var_194_end_0, end_mask = var_194_end_mask_0, x = query_1_cast_fp16)[name = tensor<string, []>("op_194_cast_fp16")];
            tensor<int32, [4]> var_198_begin_0 = const()[name = tensor<string, []>("op_198_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_198_end_0 = const()[name = tensor<string, []>("op_198_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_198_end_mask_0 = const()[name = tensor<string, []>("op_198_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_198_cast_fp16 = slice_by_index(begin = var_198_begin_0, end = var_198_end_0, end_mask = var_198_end_mask_0, x = query_1_cast_fp16)[name = tensor<string, []>("op_198_cast_fp16")];
            tensor<int32, [4]> var_202_begin_0 = const()[name = tensor<string, []>("op_202_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_202_end_0 = const()[name = tensor<string, []>("op_202_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_202_end_mask_0 = const()[name = tensor<string, []>("op_202_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_202_cast_fp16 = slice_by_index(begin = var_202_begin_0, end = var_202_end_0, end_mask = var_202_end_mask_0, x = query_1_cast_fp16)[name = tensor<string, []>("op_202_cast_fp16")];
            tensor<int32, [4]> var_206_begin_0 = const()[name = tensor<string, []>("op_206_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_206_end_0 = const()[name = tensor<string, []>("op_206_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_206_end_mask_0 = const()[name = tensor<string, []>("op_206_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_206_cast_fp16 = slice_by_index(begin = var_206_begin_0, end = var_206_end_0, end_mask = var_206_end_mask_0, x = query_1_cast_fp16)[name = tensor<string, []>("op_206_cast_fp16")];
            tensor<int32, [4]> var_210_begin_0 = const()[name = tensor<string, []>("op_210_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_210_end_0 = const()[name = tensor<string, []>("op_210_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_210_end_mask_0 = const()[name = tensor<string, []>("op_210_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_210_cast_fp16 = slice_by_index(begin = var_210_begin_0, end = var_210_end_0, end_mask = var_210_end_mask_0, x = query_1_cast_fp16)[name = tensor<string, []>("op_210_cast_fp16")];
            tensor<int32, [4]> var_214_begin_0 = const()[name = tensor<string, []>("op_214_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_214_end_0 = const()[name = tensor<string, []>("op_214_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_214_end_mask_0 = const()[name = tensor<string, []>("op_214_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_214_cast_fp16 = slice_by_index(begin = var_214_begin_0, end = var_214_end_0, end_mask = var_214_end_mask_0, x = query_1_cast_fp16)[name = tensor<string, []>("op_214_cast_fp16")];
            tensor<int32, [4]> var_218_begin_0 = const()[name = tensor<string, []>("op_218_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_218_end_0 = const()[name = tensor<string, []>("op_218_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_218_end_mask_0 = const()[name = tensor<string, []>("op_218_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_218_cast_fp16 = slice_by_index(begin = var_218_begin_0, end = var_218_end_0, end_mask = var_218_end_mask_0, x = query_1_cast_fp16)[name = tensor<string, []>("op_218_cast_fp16")];
            tensor<int32, [4]> var_227_begin_0 = const()[name = tensor<string, []>("op_227_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_227_end_0 = const()[name = tensor<string, []>("op_227_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_227_end_mask_0 = const()[name = tensor<string, []>("op_227_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_227_cast_fp16 = slice_by_index(begin = var_227_begin_0, end = var_227_end_0, end_mask = var_227_end_mask_0, x = var_190_cast_fp16)[name = tensor<string, []>("op_227_cast_fp16")];
            tensor<int32, [4]> var_234_begin_0 = const()[name = tensor<string, []>("op_234_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_234_end_0 = const()[name = tensor<string, []>("op_234_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_234_end_mask_0 = const()[name = tensor<string, []>("op_234_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_234_cast_fp16 = slice_by_index(begin = var_234_begin_0, end = var_234_end_0, end_mask = var_234_end_mask_0, x = var_190_cast_fp16)[name = tensor<string, []>("op_234_cast_fp16")];
            tensor<int32, [4]> var_241_begin_0 = const()[name = tensor<string, []>("op_241_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_241_end_0 = const()[name = tensor<string, []>("op_241_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_241_end_mask_0 = const()[name = tensor<string, []>("op_241_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_241_cast_fp16 = slice_by_index(begin = var_241_begin_0, end = var_241_end_0, end_mask = var_241_end_mask_0, x = var_190_cast_fp16)[name = tensor<string, []>("op_241_cast_fp16")];
            tensor<int32, [4]> var_248_begin_0 = const()[name = tensor<string, []>("op_248_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_248_end_0 = const()[name = tensor<string, []>("op_248_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_248_end_mask_0 = const()[name = tensor<string, []>("op_248_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_248_cast_fp16 = slice_by_index(begin = var_248_begin_0, end = var_248_end_0, end_mask = var_248_end_mask_0, x = var_190_cast_fp16)[name = tensor<string, []>("op_248_cast_fp16")];
            tensor<int32, [4]> var_255_begin_0 = const()[name = tensor<string, []>("op_255_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_255_end_0 = const()[name = tensor<string, []>("op_255_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_255_end_mask_0 = const()[name = tensor<string, []>("op_255_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_255_cast_fp16 = slice_by_index(begin = var_255_begin_0, end = var_255_end_0, end_mask = var_255_end_mask_0, x = var_194_cast_fp16)[name = tensor<string, []>("op_255_cast_fp16")];
            tensor<int32, [4]> var_262_begin_0 = const()[name = tensor<string, []>("op_262_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_262_end_0 = const()[name = tensor<string, []>("op_262_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_262_end_mask_0 = const()[name = tensor<string, []>("op_262_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_262_cast_fp16 = slice_by_index(begin = var_262_begin_0, end = var_262_end_0, end_mask = var_262_end_mask_0, x = var_194_cast_fp16)[name = tensor<string, []>("op_262_cast_fp16")];
            tensor<int32, [4]> var_269_begin_0 = const()[name = tensor<string, []>("op_269_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_269_end_0 = const()[name = tensor<string, []>("op_269_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_269_end_mask_0 = const()[name = tensor<string, []>("op_269_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_269_cast_fp16 = slice_by_index(begin = var_269_begin_0, end = var_269_end_0, end_mask = var_269_end_mask_0, x = var_194_cast_fp16)[name = tensor<string, []>("op_269_cast_fp16")];
            tensor<int32, [4]> var_276_begin_0 = const()[name = tensor<string, []>("op_276_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_276_end_0 = const()[name = tensor<string, []>("op_276_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_276_end_mask_0 = const()[name = tensor<string, []>("op_276_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_276_cast_fp16 = slice_by_index(begin = var_276_begin_0, end = var_276_end_0, end_mask = var_276_end_mask_0, x = var_194_cast_fp16)[name = tensor<string, []>("op_276_cast_fp16")];
            tensor<int32, [4]> var_283_begin_0 = const()[name = tensor<string, []>("op_283_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_283_end_0 = const()[name = tensor<string, []>("op_283_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_283_end_mask_0 = const()[name = tensor<string, []>("op_283_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_283_cast_fp16 = slice_by_index(begin = var_283_begin_0, end = var_283_end_0, end_mask = var_283_end_mask_0, x = var_198_cast_fp16)[name = tensor<string, []>("op_283_cast_fp16")];
            tensor<int32, [4]> var_290_begin_0 = const()[name = tensor<string, []>("op_290_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_290_end_0 = const()[name = tensor<string, []>("op_290_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_290_end_mask_0 = const()[name = tensor<string, []>("op_290_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_290_cast_fp16 = slice_by_index(begin = var_290_begin_0, end = var_290_end_0, end_mask = var_290_end_mask_0, x = var_198_cast_fp16)[name = tensor<string, []>("op_290_cast_fp16")];
            tensor<int32, [4]> var_297_begin_0 = const()[name = tensor<string, []>("op_297_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_297_end_0 = const()[name = tensor<string, []>("op_297_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_297_end_mask_0 = const()[name = tensor<string, []>("op_297_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_297_cast_fp16 = slice_by_index(begin = var_297_begin_0, end = var_297_end_0, end_mask = var_297_end_mask_0, x = var_198_cast_fp16)[name = tensor<string, []>("op_297_cast_fp16")];
            tensor<int32, [4]> var_304_begin_0 = const()[name = tensor<string, []>("op_304_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_304_end_0 = const()[name = tensor<string, []>("op_304_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_304_end_mask_0 = const()[name = tensor<string, []>("op_304_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_304_cast_fp16 = slice_by_index(begin = var_304_begin_0, end = var_304_end_0, end_mask = var_304_end_mask_0, x = var_198_cast_fp16)[name = tensor<string, []>("op_304_cast_fp16")];
            tensor<int32, [4]> var_311_begin_0 = const()[name = tensor<string, []>("op_311_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_311_end_0 = const()[name = tensor<string, []>("op_311_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_311_end_mask_0 = const()[name = tensor<string, []>("op_311_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_311_cast_fp16 = slice_by_index(begin = var_311_begin_0, end = var_311_end_0, end_mask = var_311_end_mask_0, x = var_202_cast_fp16)[name = tensor<string, []>("op_311_cast_fp16")];
            tensor<int32, [4]> var_318_begin_0 = const()[name = tensor<string, []>("op_318_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_318_end_0 = const()[name = tensor<string, []>("op_318_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_318_end_mask_0 = const()[name = tensor<string, []>("op_318_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_318_cast_fp16 = slice_by_index(begin = var_318_begin_0, end = var_318_end_0, end_mask = var_318_end_mask_0, x = var_202_cast_fp16)[name = tensor<string, []>("op_318_cast_fp16")];
            tensor<int32, [4]> var_325_begin_0 = const()[name = tensor<string, []>("op_325_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_325_end_0 = const()[name = tensor<string, []>("op_325_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_325_end_mask_0 = const()[name = tensor<string, []>("op_325_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_325_cast_fp16 = slice_by_index(begin = var_325_begin_0, end = var_325_end_0, end_mask = var_325_end_mask_0, x = var_202_cast_fp16)[name = tensor<string, []>("op_325_cast_fp16")];
            tensor<int32, [4]> var_332_begin_0 = const()[name = tensor<string, []>("op_332_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_332_end_0 = const()[name = tensor<string, []>("op_332_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_332_end_mask_0 = const()[name = tensor<string, []>("op_332_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_332_cast_fp16 = slice_by_index(begin = var_332_begin_0, end = var_332_end_0, end_mask = var_332_end_mask_0, x = var_202_cast_fp16)[name = tensor<string, []>("op_332_cast_fp16")];
            tensor<int32, [4]> var_339_begin_0 = const()[name = tensor<string, []>("op_339_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_339_end_0 = const()[name = tensor<string, []>("op_339_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_339_end_mask_0 = const()[name = tensor<string, []>("op_339_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_339_cast_fp16 = slice_by_index(begin = var_339_begin_0, end = var_339_end_0, end_mask = var_339_end_mask_0, x = var_206_cast_fp16)[name = tensor<string, []>("op_339_cast_fp16")];
            tensor<int32, [4]> var_346_begin_0 = const()[name = tensor<string, []>("op_346_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_346_end_0 = const()[name = tensor<string, []>("op_346_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_346_end_mask_0 = const()[name = tensor<string, []>("op_346_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_346_cast_fp16 = slice_by_index(begin = var_346_begin_0, end = var_346_end_0, end_mask = var_346_end_mask_0, x = var_206_cast_fp16)[name = tensor<string, []>("op_346_cast_fp16")];
            tensor<int32, [4]> var_353_begin_0 = const()[name = tensor<string, []>("op_353_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_353_end_0 = const()[name = tensor<string, []>("op_353_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_353_end_mask_0 = const()[name = tensor<string, []>("op_353_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_353_cast_fp16 = slice_by_index(begin = var_353_begin_0, end = var_353_end_0, end_mask = var_353_end_mask_0, x = var_206_cast_fp16)[name = tensor<string, []>("op_353_cast_fp16")];
            tensor<int32, [4]> var_360_begin_0 = const()[name = tensor<string, []>("op_360_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_360_end_0 = const()[name = tensor<string, []>("op_360_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_360_end_mask_0 = const()[name = tensor<string, []>("op_360_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_360_cast_fp16 = slice_by_index(begin = var_360_begin_0, end = var_360_end_0, end_mask = var_360_end_mask_0, x = var_206_cast_fp16)[name = tensor<string, []>("op_360_cast_fp16")];
            tensor<int32, [4]> var_367_begin_0 = const()[name = tensor<string, []>("op_367_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_367_end_0 = const()[name = tensor<string, []>("op_367_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_367_end_mask_0 = const()[name = tensor<string, []>("op_367_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_367_cast_fp16 = slice_by_index(begin = var_367_begin_0, end = var_367_end_0, end_mask = var_367_end_mask_0, x = var_210_cast_fp16)[name = tensor<string, []>("op_367_cast_fp16")];
            tensor<int32, [4]> var_374_begin_0 = const()[name = tensor<string, []>("op_374_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_374_end_0 = const()[name = tensor<string, []>("op_374_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_374_end_mask_0 = const()[name = tensor<string, []>("op_374_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_374_cast_fp16 = slice_by_index(begin = var_374_begin_0, end = var_374_end_0, end_mask = var_374_end_mask_0, x = var_210_cast_fp16)[name = tensor<string, []>("op_374_cast_fp16")];
            tensor<int32, [4]> var_381_begin_0 = const()[name = tensor<string, []>("op_381_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_381_end_0 = const()[name = tensor<string, []>("op_381_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_381_end_mask_0 = const()[name = tensor<string, []>("op_381_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_381_cast_fp16 = slice_by_index(begin = var_381_begin_0, end = var_381_end_0, end_mask = var_381_end_mask_0, x = var_210_cast_fp16)[name = tensor<string, []>("op_381_cast_fp16")];
            tensor<int32, [4]> var_388_begin_0 = const()[name = tensor<string, []>("op_388_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_388_end_0 = const()[name = tensor<string, []>("op_388_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_388_end_mask_0 = const()[name = tensor<string, []>("op_388_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_388_cast_fp16 = slice_by_index(begin = var_388_begin_0, end = var_388_end_0, end_mask = var_388_end_mask_0, x = var_210_cast_fp16)[name = tensor<string, []>("op_388_cast_fp16")];
            tensor<int32, [4]> var_395_begin_0 = const()[name = tensor<string, []>("op_395_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_395_end_0 = const()[name = tensor<string, []>("op_395_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_395_end_mask_0 = const()[name = tensor<string, []>("op_395_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_395_cast_fp16 = slice_by_index(begin = var_395_begin_0, end = var_395_end_0, end_mask = var_395_end_mask_0, x = var_214_cast_fp16)[name = tensor<string, []>("op_395_cast_fp16")];
            tensor<int32, [4]> var_402_begin_0 = const()[name = tensor<string, []>("op_402_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_402_end_0 = const()[name = tensor<string, []>("op_402_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_402_end_mask_0 = const()[name = tensor<string, []>("op_402_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_402_cast_fp16 = slice_by_index(begin = var_402_begin_0, end = var_402_end_0, end_mask = var_402_end_mask_0, x = var_214_cast_fp16)[name = tensor<string, []>("op_402_cast_fp16")];
            tensor<int32, [4]> var_409_begin_0 = const()[name = tensor<string, []>("op_409_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_409_end_0 = const()[name = tensor<string, []>("op_409_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_409_end_mask_0 = const()[name = tensor<string, []>("op_409_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_409_cast_fp16 = slice_by_index(begin = var_409_begin_0, end = var_409_end_0, end_mask = var_409_end_mask_0, x = var_214_cast_fp16)[name = tensor<string, []>("op_409_cast_fp16")];
            tensor<int32, [4]> var_416_begin_0 = const()[name = tensor<string, []>("op_416_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_416_end_0 = const()[name = tensor<string, []>("op_416_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_416_end_mask_0 = const()[name = tensor<string, []>("op_416_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_416_cast_fp16 = slice_by_index(begin = var_416_begin_0, end = var_416_end_0, end_mask = var_416_end_mask_0, x = var_214_cast_fp16)[name = tensor<string, []>("op_416_cast_fp16")];
            tensor<int32, [4]> var_423_begin_0 = const()[name = tensor<string, []>("op_423_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_423_end_0 = const()[name = tensor<string, []>("op_423_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_423_end_mask_0 = const()[name = tensor<string, []>("op_423_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_423_cast_fp16 = slice_by_index(begin = var_423_begin_0, end = var_423_end_0, end_mask = var_423_end_mask_0, x = var_218_cast_fp16)[name = tensor<string, []>("op_423_cast_fp16")];
            tensor<int32, [4]> var_430_begin_0 = const()[name = tensor<string, []>("op_430_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_430_end_0 = const()[name = tensor<string, []>("op_430_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_430_end_mask_0 = const()[name = tensor<string, []>("op_430_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_430_cast_fp16 = slice_by_index(begin = var_430_begin_0, end = var_430_end_0, end_mask = var_430_end_mask_0, x = var_218_cast_fp16)[name = tensor<string, []>("op_430_cast_fp16")];
            tensor<int32, [4]> var_437_begin_0 = const()[name = tensor<string, []>("op_437_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_437_end_0 = const()[name = tensor<string, []>("op_437_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_437_end_mask_0 = const()[name = tensor<string, []>("op_437_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_437_cast_fp16 = slice_by_index(begin = var_437_begin_0, end = var_437_end_0, end_mask = var_437_end_mask_0, x = var_218_cast_fp16)[name = tensor<string, []>("op_437_cast_fp16")];
            tensor<int32, [4]> var_444_begin_0 = const()[name = tensor<string, []>("op_444_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_444_end_0 = const()[name = tensor<string, []>("op_444_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_444_end_mask_0 = const()[name = tensor<string, []>("op_444_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_444_cast_fp16 = slice_by_index(begin = var_444_begin_0, end = var_444_end_0, end_mask = var_444_end_mask_0, x = var_218_cast_fp16)[name = tensor<string, []>("op_444_cast_fp16")];
            tensor<int32, [4]> k_1_perm_0 = const()[name = tensor<string, []>("k_1_perm_0"), val = tensor<int32, [4]>([0, 3, 2, 1])];
            tensor<int32, [4]> var_449_begin_0 = const()[name = tensor<string, []>("op_449_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_449_end_0 = const()[name = tensor<string, []>("op_449_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 64])];
            tensor<bool, [4]> var_449_end_mask_0 = const()[name = tensor<string, []>("op_449_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 512]> transpose_5 = transpose(perm = k_1_perm_0, x = key_1_cast_fp16)[name = tensor<string, []>("transpose_5")];
            tensor<fp16, [1, 1500, 1, 64]> var_449_cast_fp16 = slice_by_index(begin = var_449_begin_0, end = var_449_end_0, end_mask = var_449_end_mask_0, x = transpose_5)[name = tensor<string, []>("op_449_cast_fp16")];
            tensor<int32, [4]> var_453_begin_0 = const()[name = tensor<string, []>("op_453_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 64])];
            tensor<int32, [4]> var_453_end_0 = const()[name = tensor<string, []>("op_453_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 128])];
            tensor<bool, [4]> var_453_end_mask_0 = const()[name = tensor<string, []>("op_453_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_453_cast_fp16 = slice_by_index(begin = var_453_begin_0, end = var_453_end_0, end_mask = var_453_end_mask_0, x = transpose_5)[name = tensor<string, []>("op_453_cast_fp16")];
            tensor<int32, [4]> var_457_begin_0 = const()[name = tensor<string, []>("op_457_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 128])];
            tensor<int32, [4]> var_457_end_0 = const()[name = tensor<string, []>("op_457_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 192])];
            tensor<bool, [4]> var_457_end_mask_0 = const()[name = tensor<string, []>("op_457_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_457_cast_fp16 = slice_by_index(begin = var_457_begin_0, end = var_457_end_0, end_mask = var_457_end_mask_0, x = transpose_5)[name = tensor<string, []>("op_457_cast_fp16")];
            tensor<int32, [4]> var_461_begin_0 = const()[name = tensor<string, []>("op_461_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 192])];
            tensor<int32, [4]> var_461_end_0 = const()[name = tensor<string, []>("op_461_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 256])];
            tensor<bool, [4]> var_461_end_mask_0 = const()[name = tensor<string, []>("op_461_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_461_cast_fp16 = slice_by_index(begin = var_461_begin_0, end = var_461_end_0, end_mask = var_461_end_mask_0, x = transpose_5)[name = tensor<string, []>("op_461_cast_fp16")];
            tensor<int32, [4]> var_465_begin_0 = const()[name = tensor<string, []>("op_465_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 256])];
            tensor<int32, [4]> var_465_end_0 = const()[name = tensor<string, []>("op_465_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 320])];
            tensor<bool, [4]> var_465_end_mask_0 = const()[name = tensor<string, []>("op_465_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_465_cast_fp16 = slice_by_index(begin = var_465_begin_0, end = var_465_end_0, end_mask = var_465_end_mask_0, x = transpose_5)[name = tensor<string, []>("op_465_cast_fp16")];
            tensor<int32, [4]> var_469_begin_0 = const()[name = tensor<string, []>("op_469_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 320])];
            tensor<int32, [4]> var_469_end_0 = const()[name = tensor<string, []>("op_469_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 384])];
            tensor<bool, [4]> var_469_end_mask_0 = const()[name = tensor<string, []>("op_469_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_469_cast_fp16 = slice_by_index(begin = var_469_begin_0, end = var_469_end_0, end_mask = var_469_end_mask_0, x = transpose_5)[name = tensor<string, []>("op_469_cast_fp16")];
            tensor<int32, [4]> var_473_begin_0 = const()[name = tensor<string, []>("op_473_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 384])];
            tensor<int32, [4]> var_473_end_0 = const()[name = tensor<string, []>("op_473_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 448])];
            tensor<bool, [4]> var_473_end_mask_0 = const()[name = tensor<string, []>("op_473_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_473_cast_fp16 = slice_by_index(begin = var_473_begin_0, end = var_473_end_0, end_mask = var_473_end_mask_0, x = transpose_5)[name = tensor<string, []>("op_473_cast_fp16")];
            tensor<int32, [4]> var_477_begin_0 = const()[name = tensor<string, []>("op_477_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 448])];
            tensor<int32, [4]> var_477_end_0 = const()[name = tensor<string, []>("op_477_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 512])];
            tensor<bool, [4]> var_477_end_mask_0 = const()[name = tensor<string, []>("op_477_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_477_cast_fp16 = slice_by_index(begin = var_477_begin_0, end = var_477_end_0, end_mask = var_477_end_mask_0, x = transpose_5)[name = tensor<string, []>("op_477_cast_fp16")];
            tensor<int32, [4]> var_479_begin_0 = const()[name = tensor<string, []>("op_479_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_479_end_0 = const()[name = tensor<string, []>("op_479_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_479_end_mask_0 = const()[name = tensor<string, []>("op_479_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_479_cast_fp16 = slice_by_index(begin = var_479_begin_0, end = var_479_end_0, end_mask = var_479_end_mask_0, x = value_1_cast_fp16)[name = tensor<string, []>("op_479_cast_fp16")];
            tensor<int32, [4]> var_483_begin_0 = const()[name = tensor<string, []>("op_483_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_483_end_0 = const()[name = tensor<string, []>("op_483_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_483_end_mask_0 = const()[name = tensor<string, []>("op_483_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_483_cast_fp16 = slice_by_index(begin = var_483_begin_0, end = var_483_end_0, end_mask = var_483_end_mask_0, x = value_1_cast_fp16)[name = tensor<string, []>("op_483_cast_fp16")];
            tensor<int32, [4]> var_487_begin_0 = const()[name = tensor<string, []>("op_487_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_487_end_0 = const()[name = tensor<string, []>("op_487_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_487_end_mask_0 = const()[name = tensor<string, []>("op_487_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_487_cast_fp16 = slice_by_index(begin = var_487_begin_0, end = var_487_end_0, end_mask = var_487_end_mask_0, x = value_1_cast_fp16)[name = tensor<string, []>("op_487_cast_fp16")];
            tensor<int32, [4]> var_491_begin_0 = const()[name = tensor<string, []>("op_491_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_491_end_0 = const()[name = tensor<string, []>("op_491_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_491_end_mask_0 = const()[name = tensor<string, []>("op_491_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_491_cast_fp16 = slice_by_index(begin = var_491_begin_0, end = var_491_end_0, end_mask = var_491_end_mask_0, x = value_1_cast_fp16)[name = tensor<string, []>("op_491_cast_fp16")];
            tensor<int32, [4]> var_495_begin_0 = const()[name = tensor<string, []>("op_495_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_495_end_0 = const()[name = tensor<string, []>("op_495_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_495_end_mask_0 = const()[name = tensor<string, []>("op_495_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_495_cast_fp16 = slice_by_index(begin = var_495_begin_0, end = var_495_end_0, end_mask = var_495_end_mask_0, x = value_1_cast_fp16)[name = tensor<string, []>("op_495_cast_fp16")];
            tensor<int32, [4]> var_499_begin_0 = const()[name = tensor<string, []>("op_499_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_499_end_0 = const()[name = tensor<string, []>("op_499_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_499_end_mask_0 = const()[name = tensor<string, []>("op_499_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_499_cast_fp16 = slice_by_index(begin = var_499_begin_0, end = var_499_end_0, end_mask = var_499_end_mask_0, x = value_1_cast_fp16)[name = tensor<string, []>("op_499_cast_fp16")];
            tensor<int32, [4]> var_503_begin_0 = const()[name = tensor<string, []>("op_503_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_503_end_0 = const()[name = tensor<string, []>("op_503_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_503_end_mask_0 = const()[name = tensor<string, []>("op_503_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_503_cast_fp16 = slice_by_index(begin = var_503_begin_0, end = var_503_end_0, end_mask = var_503_end_mask_0, x = value_1_cast_fp16)[name = tensor<string, []>("op_503_cast_fp16")];
            tensor<int32, [4]> var_507_begin_0 = const()[name = tensor<string, []>("op_507_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_507_end_0 = const()[name = tensor<string, []>("op_507_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_507_end_mask_0 = const()[name = tensor<string, []>("op_507_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_507_cast_fp16 = slice_by_index(begin = var_507_begin_0, end = var_507_end_0, end_mask = var_507_end_mask_0, x = value_1_cast_fp16)[name = tensor<string, []>("op_507_cast_fp16")];
            tensor<string, []> var_511_equation_0 = const()[name = tensor<string, []>("op_511_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_511_cast_fp16 = einsum(equation = var_511_equation_0, values = (var_449_cast_fp16, var_227_cast_fp16))[name = tensor<string, []>("op_511_cast_fp16")];
            tensor<fp16, []> var_512_to_fp16 = const()[name = tensor<string, []>("op_512_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_1_cast_fp16 = mul(x = var_511_cast_fp16, y = var_512_to_fp16)[name = tensor<string, []>("aw_chunk_1_cast_fp16")];
            tensor<string, []> var_515_equation_0 = const()[name = tensor<string, []>("op_515_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_515_cast_fp16 = einsum(equation = var_515_equation_0, values = (var_449_cast_fp16, var_234_cast_fp16))[name = tensor<string, []>("op_515_cast_fp16")];
            tensor<fp16, []> var_516_to_fp16 = const()[name = tensor<string, []>("op_516_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_3_cast_fp16 = mul(x = var_515_cast_fp16, y = var_516_to_fp16)[name = tensor<string, []>("aw_chunk_3_cast_fp16")];
            tensor<string, []> var_519_equation_0 = const()[name = tensor<string, []>("op_519_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_519_cast_fp16 = einsum(equation = var_519_equation_0, values = (var_449_cast_fp16, var_241_cast_fp16))[name = tensor<string, []>("op_519_cast_fp16")];
            tensor<fp16, []> var_520_to_fp16 = const()[name = tensor<string, []>("op_520_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_5_cast_fp16 = mul(x = var_519_cast_fp16, y = var_520_to_fp16)[name = tensor<string, []>("aw_chunk_5_cast_fp16")];
            tensor<string, []> var_523_equation_0 = const()[name = tensor<string, []>("op_523_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_523_cast_fp16 = einsum(equation = var_523_equation_0, values = (var_449_cast_fp16, var_248_cast_fp16))[name = tensor<string, []>("op_523_cast_fp16")];
            tensor<fp16, []> var_524_to_fp16 = const()[name = tensor<string, []>("op_524_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_7_cast_fp16 = mul(x = var_523_cast_fp16, y = var_524_to_fp16)[name = tensor<string, []>("aw_chunk_7_cast_fp16")];
            tensor<string, []> var_527_equation_0 = const()[name = tensor<string, []>("op_527_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_527_cast_fp16 = einsum(equation = var_527_equation_0, values = (var_453_cast_fp16, var_255_cast_fp16))[name = tensor<string, []>("op_527_cast_fp16")];
            tensor<fp16, []> var_528_to_fp16 = const()[name = tensor<string, []>("op_528_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_9_cast_fp16 = mul(x = var_527_cast_fp16, y = var_528_to_fp16)[name = tensor<string, []>("aw_chunk_9_cast_fp16")];
            tensor<string, []> var_531_equation_0 = const()[name = tensor<string, []>("op_531_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_531_cast_fp16 = einsum(equation = var_531_equation_0, values = (var_453_cast_fp16, var_262_cast_fp16))[name = tensor<string, []>("op_531_cast_fp16")];
            tensor<fp16, []> var_532_to_fp16 = const()[name = tensor<string, []>("op_532_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_11_cast_fp16 = mul(x = var_531_cast_fp16, y = var_532_to_fp16)[name = tensor<string, []>("aw_chunk_11_cast_fp16")];
            tensor<string, []> var_535_equation_0 = const()[name = tensor<string, []>("op_535_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_535_cast_fp16 = einsum(equation = var_535_equation_0, values = (var_453_cast_fp16, var_269_cast_fp16))[name = tensor<string, []>("op_535_cast_fp16")];
            tensor<fp16, []> var_536_to_fp16 = const()[name = tensor<string, []>("op_536_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_13_cast_fp16 = mul(x = var_535_cast_fp16, y = var_536_to_fp16)[name = tensor<string, []>("aw_chunk_13_cast_fp16")];
            tensor<string, []> var_539_equation_0 = const()[name = tensor<string, []>("op_539_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_539_cast_fp16 = einsum(equation = var_539_equation_0, values = (var_453_cast_fp16, var_276_cast_fp16))[name = tensor<string, []>("op_539_cast_fp16")];
            tensor<fp16, []> var_540_to_fp16 = const()[name = tensor<string, []>("op_540_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_15_cast_fp16 = mul(x = var_539_cast_fp16, y = var_540_to_fp16)[name = tensor<string, []>("aw_chunk_15_cast_fp16")];
            tensor<string, []> var_543_equation_0 = const()[name = tensor<string, []>("op_543_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_543_cast_fp16 = einsum(equation = var_543_equation_0, values = (var_457_cast_fp16, var_283_cast_fp16))[name = tensor<string, []>("op_543_cast_fp16")];
            tensor<fp16, []> var_544_to_fp16 = const()[name = tensor<string, []>("op_544_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_17_cast_fp16 = mul(x = var_543_cast_fp16, y = var_544_to_fp16)[name = tensor<string, []>("aw_chunk_17_cast_fp16")];
            tensor<string, []> var_547_equation_0 = const()[name = tensor<string, []>("op_547_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_547_cast_fp16 = einsum(equation = var_547_equation_0, values = (var_457_cast_fp16, var_290_cast_fp16))[name = tensor<string, []>("op_547_cast_fp16")];
            tensor<fp16, []> var_548_to_fp16 = const()[name = tensor<string, []>("op_548_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_19_cast_fp16 = mul(x = var_547_cast_fp16, y = var_548_to_fp16)[name = tensor<string, []>("aw_chunk_19_cast_fp16")];
            tensor<string, []> var_551_equation_0 = const()[name = tensor<string, []>("op_551_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_551_cast_fp16 = einsum(equation = var_551_equation_0, values = (var_457_cast_fp16, var_297_cast_fp16))[name = tensor<string, []>("op_551_cast_fp16")];
            tensor<fp16, []> var_552_to_fp16 = const()[name = tensor<string, []>("op_552_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_21_cast_fp16 = mul(x = var_551_cast_fp16, y = var_552_to_fp16)[name = tensor<string, []>("aw_chunk_21_cast_fp16")];
            tensor<string, []> var_555_equation_0 = const()[name = tensor<string, []>("op_555_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_555_cast_fp16 = einsum(equation = var_555_equation_0, values = (var_457_cast_fp16, var_304_cast_fp16))[name = tensor<string, []>("op_555_cast_fp16")];
            tensor<fp16, []> var_556_to_fp16 = const()[name = tensor<string, []>("op_556_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_23_cast_fp16 = mul(x = var_555_cast_fp16, y = var_556_to_fp16)[name = tensor<string, []>("aw_chunk_23_cast_fp16")];
            tensor<string, []> var_559_equation_0 = const()[name = tensor<string, []>("op_559_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_559_cast_fp16 = einsum(equation = var_559_equation_0, values = (var_461_cast_fp16, var_311_cast_fp16))[name = tensor<string, []>("op_559_cast_fp16")];
            tensor<fp16, []> var_560_to_fp16 = const()[name = tensor<string, []>("op_560_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_25_cast_fp16 = mul(x = var_559_cast_fp16, y = var_560_to_fp16)[name = tensor<string, []>("aw_chunk_25_cast_fp16")];
            tensor<string, []> var_563_equation_0 = const()[name = tensor<string, []>("op_563_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_563_cast_fp16 = einsum(equation = var_563_equation_0, values = (var_461_cast_fp16, var_318_cast_fp16))[name = tensor<string, []>("op_563_cast_fp16")];
            tensor<fp16, []> var_564_to_fp16 = const()[name = tensor<string, []>("op_564_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_27_cast_fp16 = mul(x = var_563_cast_fp16, y = var_564_to_fp16)[name = tensor<string, []>("aw_chunk_27_cast_fp16")];
            tensor<string, []> var_567_equation_0 = const()[name = tensor<string, []>("op_567_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_567_cast_fp16 = einsum(equation = var_567_equation_0, values = (var_461_cast_fp16, var_325_cast_fp16))[name = tensor<string, []>("op_567_cast_fp16")];
            tensor<fp16, []> var_568_to_fp16 = const()[name = tensor<string, []>("op_568_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_29_cast_fp16 = mul(x = var_567_cast_fp16, y = var_568_to_fp16)[name = tensor<string, []>("aw_chunk_29_cast_fp16")];
            tensor<string, []> var_571_equation_0 = const()[name = tensor<string, []>("op_571_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_571_cast_fp16 = einsum(equation = var_571_equation_0, values = (var_461_cast_fp16, var_332_cast_fp16))[name = tensor<string, []>("op_571_cast_fp16")];
            tensor<fp16, []> var_572_to_fp16 = const()[name = tensor<string, []>("op_572_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_31_cast_fp16 = mul(x = var_571_cast_fp16, y = var_572_to_fp16)[name = tensor<string, []>("aw_chunk_31_cast_fp16")];
            tensor<string, []> var_575_equation_0 = const()[name = tensor<string, []>("op_575_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_575_cast_fp16 = einsum(equation = var_575_equation_0, values = (var_465_cast_fp16, var_339_cast_fp16))[name = tensor<string, []>("op_575_cast_fp16")];
            tensor<fp16, []> var_576_to_fp16 = const()[name = tensor<string, []>("op_576_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_33_cast_fp16 = mul(x = var_575_cast_fp16, y = var_576_to_fp16)[name = tensor<string, []>("aw_chunk_33_cast_fp16")];
            tensor<string, []> var_579_equation_0 = const()[name = tensor<string, []>("op_579_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_579_cast_fp16 = einsum(equation = var_579_equation_0, values = (var_465_cast_fp16, var_346_cast_fp16))[name = tensor<string, []>("op_579_cast_fp16")];
            tensor<fp16, []> var_580_to_fp16 = const()[name = tensor<string, []>("op_580_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_35_cast_fp16 = mul(x = var_579_cast_fp16, y = var_580_to_fp16)[name = tensor<string, []>("aw_chunk_35_cast_fp16")];
            tensor<string, []> var_583_equation_0 = const()[name = tensor<string, []>("op_583_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_583_cast_fp16 = einsum(equation = var_583_equation_0, values = (var_465_cast_fp16, var_353_cast_fp16))[name = tensor<string, []>("op_583_cast_fp16")];
            tensor<fp16, []> var_584_to_fp16 = const()[name = tensor<string, []>("op_584_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_37_cast_fp16 = mul(x = var_583_cast_fp16, y = var_584_to_fp16)[name = tensor<string, []>("aw_chunk_37_cast_fp16")];
            tensor<string, []> var_587_equation_0 = const()[name = tensor<string, []>("op_587_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_587_cast_fp16 = einsum(equation = var_587_equation_0, values = (var_465_cast_fp16, var_360_cast_fp16))[name = tensor<string, []>("op_587_cast_fp16")];
            tensor<fp16, []> var_588_to_fp16 = const()[name = tensor<string, []>("op_588_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_39_cast_fp16 = mul(x = var_587_cast_fp16, y = var_588_to_fp16)[name = tensor<string, []>("aw_chunk_39_cast_fp16")];
            tensor<string, []> var_591_equation_0 = const()[name = tensor<string, []>("op_591_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_591_cast_fp16 = einsum(equation = var_591_equation_0, values = (var_469_cast_fp16, var_367_cast_fp16))[name = tensor<string, []>("op_591_cast_fp16")];
            tensor<fp16, []> var_592_to_fp16 = const()[name = tensor<string, []>("op_592_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_41_cast_fp16 = mul(x = var_591_cast_fp16, y = var_592_to_fp16)[name = tensor<string, []>("aw_chunk_41_cast_fp16")];
            tensor<string, []> var_595_equation_0 = const()[name = tensor<string, []>("op_595_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_595_cast_fp16 = einsum(equation = var_595_equation_0, values = (var_469_cast_fp16, var_374_cast_fp16))[name = tensor<string, []>("op_595_cast_fp16")];
            tensor<fp16, []> var_596_to_fp16 = const()[name = tensor<string, []>("op_596_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_43_cast_fp16 = mul(x = var_595_cast_fp16, y = var_596_to_fp16)[name = tensor<string, []>("aw_chunk_43_cast_fp16")];
            tensor<string, []> var_599_equation_0 = const()[name = tensor<string, []>("op_599_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_599_cast_fp16 = einsum(equation = var_599_equation_0, values = (var_469_cast_fp16, var_381_cast_fp16))[name = tensor<string, []>("op_599_cast_fp16")];
            tensor<fp16, []> var_600_to_fp16 = const()[name = tensor<string, []>("op_600_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_45_cast_fp16 = mul(x = var_599_cast_fp16, y = var_600_to_fp16)[name = tensor<string, []>("aw_chunk_45_cast_fp16")];
            tensor<string, []> var_603_equation_0 = const()[name = tensor<string, []>("op_603_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_603_cast_fp16 = einsum(equation = var_603_equation_0, values = (var_469_cast_fp16, var_388_cast_fp16))[name = tensor<string, []>("op_603_cast_fp16")];
            tensor<fp16, []> var_604_to_fp16 = const()[name = tensor<string, []>("op_604_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_47_cast_fp16 = mul(x = var_603_cast_fp16, y = var_604_to_fp16)[name = tensor<string, []>("aw_chunk_47_cast_fp16")];
            tensor<string, []> var_607_equation_0 = const()[name = tensor<string, []>("op_607_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_607_cast_fp16 = einsum(equation = var_607_equation_0, values = (var_473_cast_fp16, var_395_cast_fp16))[name = tensor<string, []>("op_607_cast_fp16")];
            tensor<fp16, []> var_608_to_fp16 = const()[name = tensor<string, []>("op_608_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_49_cast_fp16 = mul(x = var_607_cast_fp16, y = var_608_to_fp16)[name = tensor<string, []>("aw_chunk_49_cast_fp16")];
            tensor<string, []> var_611_equation_0 = const()[name = tensor<string, []>("op_611_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_611_cast_fp16 = einsum(equation = var_611_equation_0, values = (var_473_cast_fp16, var_402_cast_fp16))[name = tensor<string, []>("op_611_cast_fp16")];
            tensor<fp16, []> var_612_to_fp16 = const()[name = tensor<string, []>("op_612_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_51_cast_fp16 = mul(x = var_611_cast_fp16, y = var_612_to_fp16)[name = tensor<string, []>("aw_chunk_51_cast_fp16")];
            tensor<string, []> var_615_equation_0 = const()[name = tensor<string, []>("op_615_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_615_cast_fp16 = einsum(equation = var_615_equation_0, values = (var_473_cast_fp16, var_409_cast_fp16))[name = tensor<string, []>("op_615_cast_fp16")];
            tensor<fp16, []> var_616_to_fp16 = const()[name = tensor<string, []>("op_616_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_53_cast_fp16 = mul(x = var_615_cast_fp16, y = var_616_to_fp16)[name = tensor<string, []>("aw_chunk_53_cast_fp16")];
            tensor<string, []> var_619_equation_0 = const()[name = tensor<string, []>("op_619_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_619_cast_fp16 = einsum(equation = var_619_equation_0, values = (var_473_cast_fp16, var_416_cast_fp16))[name = tensor<string, []>("op_619_cast_fp16")];
            tensor<fp16, []> var_620_to_fp16 = const()[name = tensor<string, []>("op_620_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_55_cast_fp16 = mul(x = var_619_cast_fp16, y = var_620_to_fp16)[name = tensor<string, []>("aw_chunk_55_cast_fp16")];
            tensor<string, []> var_623_equation_0 = const()[name = tensor<string, []>("op_623_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_623_cast_fp16 = einsum(equation = var_623_equation_0, values = (var_477_cast_fp16, var_423_cast_fp16))[name = tensor<string, []>("op_623_cast_fp16")];
            tensor<fp16, []> var_624_to_fp16 = const()[name = tensor<string, []>("op_624_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_57_cast_fp16 = mul(x = var_623_cast_fp16, y = var_624_to_fp16)[name = tensor<string, []>("aw_chunk_57_cast_fp16")];
            tensor<string, []> var_627_equation_0 = const()[name = tensor<string, []>("op_627_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_627_cast_fp16 = einsum(equation = var_627_equation_0, values = (var_477_cast_fp16, var_430_cast_fp16))[name = tensor<string, []>("op_627_cast_fp16")];
            tensor<fp16, []> var_628_to_fp16 = const()[name = tensor<string, []>("op_628_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_59_cast_fp16 = mul(x = var_627_cast_fp16, y = var_628_to_fp16)[name = tensor<string, []>("aw_chunk_59_cast_fp16")];
            tensor<string, []> var_631_equation_0 = const()[name = tensor<string, []>("op_631_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_631_cast_fp16 = einsum(equation = var_631_equation_0, values = (var_477_cast_fp16, var_437_cast_fp16))[name = tensor<string, []>("op_631_cast_fp16")];
            tensor<fp16, []> var_632_to_fp16 = const()[name = tensor<string, []>("op_632_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_61_cast_fp16 = mul(x = var_631_cast_fp16, y = var_632_to_fp16)[name = tensor<string, []>("aw_chunk_61_cast_fp16")];
            tensor<string, []> var_635_equation_0 = const()[name = tensor<string, []>("op_635_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_635_cast_fp16 = einsum(equation = var_635_equation_0, values = (var_477_cast_fp16, var_444_cast_fp16))[name = tensor<string, []>("op_635_cast_fp16")];
            tensor<fp16, []> var_636_to_fp16 = const()[name = tensor<string, []>("op_636_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_63_cast_fp16 = mul(x = var_635_cast_fp16, y = var_636_to_fp16)[name = tensor<string, []>("aw_chunk_63_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_638_cast_fp16 = softmax(axis = var_135, x = aw_chunk_1_cast_fp16)[name = tensor<string, []>("op_638_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_639_cast_fp16 = softmax(axis = var_135, x = aw_chunk_3_cast_fp16)[name = tensor<string, []>("op_639_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_640_cast_fp16 = softmax(axis = var_135, x = aw_chunk_5_cast_fp16)[name = tensor<string, []>("op_640_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_641_cast_fp16 = softmax(axis = var_135, x = aw_chunk_7_cast_fp16)[name = tensor<string, []>("op_641_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_642_cast_fp16 = softmax(axis = var_135, x = aw_chunk_9_cast_fp16)[name = tensor<string, []>("op_642_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_643_cast_fp16 = softmax(axis = var_135, x = aw_chunk_11_cast_fp16)[name = tensor<string, []>("op_643_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_644_cast_fp16 = softmax(axis = var_135, x = aw_chunk_13_cast_fp16)[name = tensor<string, []>("op_644_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_645_cast_fp16 = softmax(axis = var_135, x = aw_chunk_15_cast_fp16)[name = tensor<string, []>("op_645_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_646_cast_fp16 = softmax(axis = var_135, x = aw_chunk_17_cast_fp16)[name = tensor<string, []>("op_646_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_647_cast_fp16 = softmax(axis = var_135, x = aw_chunk_19_cast_fp16)[name = tensor<string, []>("op_647_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_648_cast_fp16 = softmax(axis = var_135, x = aw_chunk_21_cast_fp16)[name = tensor<string, []>("op_648_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_649_cast_fp16 = softmax(axis = var_135, x = aw_chunk_23_cast_fp16)[name = tensor<string, []>("op_649_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_650_cast_fp16 = softmax(axis = var_135, x = aw_chunk_25_cast_fp16)[name = tensor<string, []>("op_650_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_651_cast_fp16 = softmax(axis = var_135, x = aw_chunk_27_cast_fp16)[name = tensor<string, []>("op_651_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_652_cast_fp16 = softmax(axis = var_135, x = aw_chunk_29_cast_fp16)[name = tensor<string, []>("op_652_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_653_cast_fp16 = softmax(axis = var_135, x = aw_chunk_31_cast_fp16)[name = tensor<string, []>("op_653_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_654_cast_fp16 = softmax(axis = var_135, x = aw_chunk_33_cast_fp16)[name = tensor<string, []>("op_654_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_655_cast_fp16 = softmax(axis = var_135, x = aw_chunk_35_cast_fp16)[name = tensor<string, []>("op_655_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_656_cast_fp16 = softmax(axis = var_135, x = aw_chunk_37_cast_fp16)[name = tensor<string, []>("op_656_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_657_cast_fp16 = softmax(axis = var_135, x = aw_chunk_39_cast_fp16)[name = tensor<string, []>("op_657_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_658_cast_fp16 = softmax(axis = var_135, x = aw_chunk_41_cast_fp16)[name = tensor<string, []>("op_658_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_659_cast_fp16 = softmax(axis = var_135, x = aw_chunk_43_cast_fp16)[name = tensor<string, []>("op_659_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_660_cast_fp16 = softmax(axis = var_135, x = aw_chunk_45_cast_fp16)[name = tensor<string, []>("op_660_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_661_cast_fp16 = softmax(axis = var_135, x = aw_chunk_47_cast_fp16)[name = tensor<string, []>("op_661_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_662_cast_fp16 = softmax(axis = var_135, x = aw_chunk_49_cast_fp16)[name = tensor<string, []>("op_662_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_663_cast_fp16 = softmax(axis = var_135, x = aw_chunk_51_cast_fp16)[name = tensor<string, []>("op_663_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_664_cast_fp16 = softmax(axis = var_135, x = aw_chunk_53_cast_fp16)[name = tensor<string, []>("op_664_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_665_cast_fp16 = softmax(axis = var_135, x = aw_chunk_55_cast_fp16)[name = tensor<string, []>("op_665_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_666_cast_fp16 = softmax(axis = var_135, x = aw_chunk_57_cast_fp16)[name = tensor<string, []>("op_666_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_667_cast_fp16 = softmax(axis = var_135, x = aw_chunk_59_cast_fp16)[name = tensor<string, []>("op_667_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_668_cast_fp16 = softmax(axis = var_135, x = aw_chunk_61_cast_fp16)[name = tensor<string, []>("op_668_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_669_cast_fp16 = softmax(axis = var_135, x = aw_chunk_63_cast_fp16)[name = tensor<string, []>("op_669_cast_fp16")];
            tensor<string, []> var_671_equation_0 = const()[name = tensor<string, []>("op_671_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_671_cast_fp16 = einsum(equation = var_671_equation_0, values = (var_479_cast_fp16, var_638_cast_fp16))[name = tensor<string, []>("op_671_cast_fp16")];
            tensor<string, []> var_673_equation_0 = const()[name = tensor<string, []>("op_673_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_673_cast_fp16 = einsum(equation = var_673_equation_0, values = (var_479_cast_fp16, var_639_cast_fp16))[name = tensor<string, []>("op_673_cast_fp16")];
            tensor<string, []> var_675_equation_0 = const()[name = tensor<string, []>("op_675_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_675_cast_fp16 = einsum(equation = var_675_equation_0, values = (var_479_cast_fp16, var_640_cast_fp16))[name = tensor<string, []>("op_675_cast_fp16")];
            tensor<string, []> var_677_equation_0 = const()[name = tensor<string, []>("op_677_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_677_cast_fp16 = einsum(equation = var_677_equation_0, values = (var_479_cast_fp16, var_641_cast_fp16))[name = tensor<string, []>("op_677_cast_fp16")];
            tensor<string, []> var_679_equation_0 = const()[name = tensor<string, []>("op_679_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_679_cast_fp16 = einsum(equation = var_679_equation_0, values = (var_483_cast_fp16, var_642_cast_fp16))[name = tensor<string, []>("op_679_cast_fp16")];
            tensor<string, []> var_681_equation_0 = const()[name = tensor<string, []>("op_681_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_681_cast_fp16 = einsum(equation = var_681_equation_0, values = (var_483_cast_fp16, var_643_cast_fp16))[name = tensor<string, []>("op_681_cast_fp16")];
            tensor<string, []> var_683_equation_0 = const()[name = tensor<string, []>("op_683_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_683_cast_fp16 = einsum(equation = var_683_equation_0, values = (var_483_cast_fp16, var_644_cast_fp16))[name = tensor<string, []>("op_683_cast_fp16")];
            tensor<string, []> var_685_equation_0 = const()[name = tensor<string, []>("op_685_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_685_cast_fp16 = einsum(equation = var_685_equation_0, values = (var_483_cast_fp16, var_645_cast_fp16))[name = tensor<string, []>("op_685_cast_fp16")];
            tensor<string, []> var_687_equation_0 = const()[name = tensor<string, []>("op_687_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_687_cast_fp16 = einsum(equation = var_687_equation_0, values = (var_487_cast_fp16, var_646_cast_fp16))[name = tensor<string, []>("op_687_cast_fp16")];
            tensor<string, []> var_689_equation_0 = const()[name = tensor<string, []>("op_689_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_689_cast_fp16 = einsum(equation = var_689_equation_0, values = (var_487_cast_fp16, var_647_cast_fp16))[name = tensor<string, []>("op_689_cast_fp16")];
            tensor<string, []> var_691_equation_0 = const()[name = tensor<string, []>("op_691_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_691_cast_fp16 = einsum(equation = var_691_equation_0, values = (var_487_cast_fp16, var_648_cast_fp16))[name = tensor<string, []>("op_691_cast_fp16")];
            tensor<string, []> var_693_equation_0 = const()[name = tensor<string, []>("op_693_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_693_cast_fp16 = einsum(equation = var_693_equation_0, values = (var_487_cast_fp16, var_649_cast_fp16))[name = tensor<string, []>("op_693_cast_fp16")];
            tensor<string, []> var_695_equation_0 = const()[name = tensor<string, []>("op_695_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_695_cast_fp16 = einsum(equation = var_695_equation_0, values = (var_491_cast_fp16, var_650_cast_fp16))[name = tensor<string, []>("op_695_cast_fp16")];
            tensor<string, []> var_697_equation_0 = const()[name = tensor<string, []>("op_697_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_697_cast_fp16 = einsum(equation = var_697_equation_0, values = (var_491_cast_fp16, var_651_cast_fp16))[name = tensor<string, []>("op_697_cast_fp16")];
            tensor<string, []> var_699_equation_0 = const()[name = tensor<string, []>("op_699_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_699_cast_fp16 = einsum(equation = var_699_equation_0, values = (var_491_cast_fp16, var_652_cast_fp16))[name = tensor<string, []>("op_699_cast_fp16")];
            tensor<string, []> var_701_equation_0 = const()[name = tensor<string, []>("op_701_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_701_cast_fp16 = einsum(equation = var_701_equation_0, values = (var_491_cast_fp16, var_653_cast_fp16))[name = tensor<string, []>("op_701_cast_fp16")];
            tensor<string, []> var_703_equation_0 = const()[name = tensor<string, []>("op_703_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_703_cast_fp16 = einsum(equation = var_703_equation_0, values = (var_495_cast_fp16, var_654_cast_fp16))[name = tensor<string, []>("op_703_cast_fp16")];
            tensor<string, []> var_705_equation_0 = const()[name = tensor<string, []>("op_705_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_705_cast_fp16 = einsum(equation = var_705_equation_0, values = (var_495_cast_fp16, var_655_cast_fp16))[name = tensor<string, []>("op_705_cast_fp16")];
            tensor<string, []> var_707_equation_0 = const()[name = tensor<string, []>("op_707_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_707_cast_fp16 = einsum(equation = var_707_equation_0, values = (var_495_cast_fp16, var_656_cast_fp16))[name = tensor<string, []>("op_707_cast_fp16")];
            tensor<string, []> var_709_equation_0 = const()[name = tensor<string, []>("op_709_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_709_cast_fp16 = einsum(equation = var_709_equation_0, values = (var_495_cast_fp16, var_657_cast_fp16))[name = tensor<string, []>("op_709_cast_fp16")];
            tensor<string, []> var_711_equation_0 = const()[name = tensor<string, []>("op_711_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_711_cast_fp16 = einsum(equation = var_711_equation_0, values = (var_499_cast_fp16, var_658_cast_fp16))[name = tensor<string, []>("op_711_cast_fp16")];
            tensor<string, []> var_713_equation_0 = const()[name = tensor<string, []>("op_713_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_713_cast_fp16 = einsum(equation = var_713_equation_0, values = (var_499_cast_fp16, var_659_cast_fp16))[name = tensor<string, []>("op_713_cast_fp16")];
            tensor<string, []> var_715_equation_0 = const()[name = tensor<string, []>("op_715_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_715_cast_fp16 = einsum(equation = var_715_equation_0, values = (var_499_cast_fp16, var_660_cast_fp16))[name = tensor<string, []>("op_715_cast_fp16")];
            tensor<string, []> var_717_equation_0 = const()[name = tensor<string, []>("op_717_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_717_cast_fp16 = einsum(equation = var_717_equation_0, values = (var_499_cast_fp16, var_661_cast_fp16))[name = tensor<string, []>("op_717_cast_fp16")];
            tensor<string, []> var_719_equation_0 = const()[name = tensor<string, []>("op_719_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_719_cast_fp16 = einsum(equation = var_719_equation_0, values = (var_503_cast_fp16, var_662_cast_fp16))[name = tensor<string, []>("op_719_cast_fp16")];
            tensor<string, []> var_721_equation_0 = const()[name = tensor<string, []>("op_721_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_721_cast_fp16 = einsum(equation = var_721_equation_0, values = (var_503_cast_fp16, var_663_cast_fp16))[name = tensor<string, []>("op_721_cast_fp16")];
            tensor<string, []> var_723_equation_0 = const()[name = tensor<string, []>("op_723_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_723_cast_fp16 = einsum(equation = var_723_equation_0, values = (var_503_cast_fp16, var_664_cast_fp16))[name = tensor<string, []>("op_723_cast_fp16")];
            tensor<string, []> var_725_equation_0 = const()[name = tensor<string, []>("op_725_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_725_cast_fp16 = einsum(equation = var_725_equation_0, values = (var_503_cast_fp16, var_665_cast_fp16))[name = tensor<string, []>("op_725_cast_fp16")];
            tensor<string, []> var_727_equation_0 = const()[name = tensor<string, []>("op_727_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_727_cast_fp16 = einsum(equation = var_727_equation_0, values = (var_507_cast_fp16, var_666_cast_fp16))[name = tensor<string, []>("op_727_cast_fp16")];
            tensor<string, []> var_729_equation_0 = const()[name = tensor<string, []>("op_729_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_729_cast_fp16 = einsum(equation = var_729_equation_0, values = (var_507_cast_fp16, var_667_cast_fp16))[name = tensor<string, []>("op_729_cast_fp16")];
            tensor<string, []> var_731_equation_0 = const()[name = tensor<string, []>("op_731_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_731_cast_fp16 = einsum(equation = var_731_equation_0, values = (var_507_cast_fp16, var_668_cast_fp16))[name = tensor<string, []>("op_731_cast_fp16")];
            tensor<string, []> var_733_equation_0 = const()[name = tensor<string, []>("op_733_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_733_cast_fp16 = einsum(equation = var_733_equation_0, values = (var_507_cast_fp16, var_669_cast_fp16))[name = tensor<string, []>("op_733_cast_fp16")];
            tensor<bool, []> var_735_interleave_0 = const()[name = tensor<string, []>("op_735_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_735_cast_fp16 = concat(axis = var_122, interleave = var_735_interleave_0, values = (var_671_cast_fp16, var_673_cast_fp16, var_675_cast_fp16, var_677_cast_fp16))[name = tensor<string, []>("op_735_cast_fp16")];
            tensor<bool, []> var_737_interleave_0 = const()[name = tensor<string, []>("op_737_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_737_cast_fp16 = concat(axis = var_122, interleave = var_737_interleave_0, values = (var_679_cast_fp16, var_681_cast_fp16, var_683_cast_fp16, var_685_cast_fp16))[name = tensor<string, []>("op_737_cast_fp16")];
            tensor<bool, []> var_739_interleave_0 = const()[name = tensor<string, []>("op_739_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_739_cast_fp16 = concat(axis = var_122, interleave = var_739_interleave_0, values = (var_687_cast_fp16, var_689_cast_fp16, var_691_cast_fp16, var_693_cast_fp16))[name = tensor<string, []>("op_739_cast_fp16")];
            tensor<bool, []> var_741_interleave_0 = const()[name = tensor<string, []>("op_741_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_741_cast_fp16 = concat(axis = var_122, interleave = var_741_interleave_0, values = (var_695_cast_fp16, var_697_cast_fp16, var_699_cast_fp16, var_701_cast_fp16))[name = tensor<string, []>("op_741_cast_fp16")];
            tensor<bool, []> var_743_interleave_0 = const()[name = tensor<string, []>("op_743_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_743_cast_fp16 = concat(axis = var_122, interleave = var_743_interleave_0, values = (var_703_cast_fp16, var_705_cast_fp16, var_707_cast_fp16, var_709_cast_fp16))[name = tensor<string, []>("op_743_cast_fp16")];
            tensor<bool, []> var_745_interleave_0 = const()[name = tensor<string, []>("op_745_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_745_cast_fp16 = concat(axis = var_122, interleave = var_745_interleave_0, values = (var_711_cast_fp16, var_713_cast_fp16, var_715_cast_fp16, var_717_cast_fp16))[name = tensor<string, []>("op_745_cast_fp16")];
            tensor<bool, []> var_747_interleave_0 = const()[name = tensor<string, []>("op_747_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_747_cast_fp16 = concat(axis = var_122, interleave = var_747_interleave_0, values = (var_719_cast_fp16, var_721_cast_fp16, var_723_cast_fp16, var_725_cast_fp16))[name = tensor<string, []>("op_747_cast_fp16")];
            tensor<bool, []> var_749_interleave_0 = const()[name = tensor<string, []>("op_749_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_749_cast_fp16 = concat(axis = var_122, interleave = var_749_interleave_0, values = (var_727_cast_fp16, var_729_cast_fp16, var_731_cast_fp16, var_733_cast_fp16))[name = tensor<string, []>("op_749_cast_fp16")];
            tensor<bool, []> input_1_interleave_0 = const()[name = tensor<string, []>("input_1_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 512, 1, 1500]> input_1_cast_fp16 = concat(axis = var_135, interleave = input_1_interleave_0, values = (var_735_cast_fp16, var_737_cast_fp16, var_739_cast_fp16, var_741_cast_fp16, var_743_cast_fp16, var_745_cast_fp16, var_747_cast_fp16, var_749_cast_fp16))[name = tensor<string, []>("input_1_cast_fp16")];
            tensor<int32, [2]> var_754 = const()[name = tensor<string, []>("op_754"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_756 = const()[name = tensor<string, []>("op_756"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_3_pad_type_0 = const()[name = tensor<string, []>("obj_3_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_3_pad_0 = const()[name = tensor<string, []>("obj_3_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_0_self_attn_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_o_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(4936640)))];
            tensor<fp16, [512]> layers_0_self_attn_o_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_self_attn_o_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5460992)))];
            tensor<fp16, [1, 512, 1, 1500]> obj_3_cast_fp16 = conv(bias = layers_0_self_attn_o_proj_bias_to_fp16, dilations = var_756, groups = var_135, pad = obj_3_pad_0, pad_type = obj_3_pad_type_0, strides = var_754, weight = layers_0_self_attn_o_proj_weight_to_fp16, x = input_1_cast_fp16)[name = tensor<string, []>("obj_3_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_3_cast_fp16 = add(x = inputs_1_cast_fp16, y = obj_3_cast_fp16)[name = tensor<string, []>("inputs_3_cast_fp16")];
            tensor<int32, [1]> var_762 = const()[name = tensor<string, []>("op_762"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_3_cast_fp16 = reduce_mean(axes = var_762, keep_dims = var_136, x = inputs_3_cast_fp16)[name = tensor<string, []>("channels_mean_3_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_3_cast_fp16 = sub(x = inputs_3_cast_fp16, y = channels_mean_3_cast_fp16)[name = tensor<string, []>("zero_mean_3_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_3_cast_fp16 = mul(x = zero_mean_3_cast_fp16, y = zero_mean_3_cast_fp16)[name = tensor<string, []>("zero_mean_sq_3_cast_fp16")];
            tensor<int32, [1]> var_766 = const()[name = tensor<string, []>("op_766"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_767_cast_fp16 = reduce_mean(axes = var_766, keep_dims = var_136, x = zero_mean_sq_3_cast_fp16)[name = tensor<string, []>("op_767_cast_fp16")];
            tensor<fp16, []> var_768_to_fp16 = const()[name = tensor<string, []>("op_768_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_769_cast_fp16 = add(x = var_767_cast_fp16, y = var_768_to_fp16)[name = tensor<string, []>("op_769_cast_fp16")];
            tensor<fp16, []> denom_3_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_3_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_3_cast_fp16 = rsqrt(epsilon = denom_3_epsilon_0_to_fp16, x = var_769_cast_fp16)[name = tensor<string, []>("denom_3_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_3_cast_fp16 = mul(x = zero_mean_3_cast_fp16, y = denom_3_cast_fp16)[name = tensor<string, []>("out_3_cast_fp16")];
            tensor<fp16, [512]> input_3_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_3_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5462080)))];
            tensor<fp16, [512]> input_3_beta_0_to_fp16 = const()[name = tensor<string, []>("input_3_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5463168)))];
            tensor<fp16, []> input_3_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_3_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> input_3_cast_fp16 = batch_norm(beta = input_3_beta_0_to_fp16, epsilon = input_3_epsilon_0_to_fp16, gamma = input_3_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_3_cast_fp16)[name = tensor<string, []>("input_3_cast_fp16")];
            tensor<int32, [2]> var_780 = const()[name = tensor<string, []>("op_780"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_782 = const()[name = tensor<string, []>("op_782"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> input_5_pad_type_0 = const()[name = tensor<string, []>("input_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> input_5_pad_0 = const()[name = tensor<string, []>("input_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [2048, 512, 1, 1]> layers_0_fc1_weight_to_fp16 = const()[name = tensor<string, []>("layers_0_fc1_weight_to_fp16"), val = tensor<fp16, [2048, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(5464256)))];
            tensor<fp16, [2048]> layers_0_fc1_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_fc1_bias_to_fp16"), val = tensor<fp16, [2048]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7561472)))];
            tensor<fp16, [1, 2048, 1, 1500]> input_5_cast_fp16 = conv(bias = layers_0_fc1_bias_to_fp16, dilations = var_782, groups = var_135, pad = input_5_pad_0, pad_type = input_5_pad_type_0, strides = var_780, weight = layers_0_fc1_weight_to_fp16, x = input_3_cast_fp16)[name = tensor<string, []>("input_5_cast_fp16")];
            tensor<string, []> input_7_mode_0 = const()[name = tensor<string, []>("input_7_mode_0"), val = tensor<string, []>("EXACT")];
            tensor<fp16, [1, 2048, 1, 1500]> input_7_cast_fp16 = gelu(mode = input_7_mode_0, x = input_5_cast_fp16)[name = tensor<string, []>("input_7_cast_fp16")];
            tensor<int32, [2]> var_788 = const()[name = tensor<string, []>("op_788"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_790 = const()[name = tensor<string, []>("op_790"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> hidden_states_5_pad_type_0 = const()[name = tensor<string, []>("hidden_states_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> hidden_states_5_pad_0 = const()[name = tensor<string, []>("hidden_states_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 2048, 1, 1]> layers_0_fc2_weight_to_fp16 = const()[name = tensor<string, []>("layers_0_fc2_weight_to_fp16"), val = tensor<fp16, [512, 2048, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(7565632)))];
            tensor<fp16, [512]> layers_0_fc2_bias_to_fp16 = const()[name = tensor<string, []>("layers_0_fc2_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9662848)))];
            tensor<fp16, [1, 512, 1, 1500]> hidden_states_5_cast_fp16 = conv(bias = layers_0_fc2_bias_to_fp16, dilations = var_790, groups = var_135, pad = hidden_states_5_pad_0, pad_type = hidden_states_5_pad_type_0, strides = var_788, weight = layers_0_fc2_weight_to_fp16, x = input_7_cast_fp16)[name = tensor<string, []>("hidden_states_5_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_5_cast_fp16 = add(x = inputs_3_cast_fp16, y = hidden_states_5_cast_fp16)[name = tensor<string, []>("inputs_5_cast_fp16")];
            tensor<int32, []> var_797 = const()[name = tensor<string, []>("op_797"), val = tensor<int32, []>(3)];
            tensor<int32, []> var_810 = const()[name = tensor<string, []>("op_810"), val = tensor<int32, []>(1)];
            tensor<bool, []> var_811 = const()[name = tensor<string, []>("op_811"), val = tensor<bool, []>(true)];
            tensor<int32, [1]> var_821 = const()[name = tensor<string, []>("op_821"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_5_cast_fp16 = reduce_mean(axes = var_821, keep_dims = var_811, x = inputs_5_cast_fp16)[name = tensor<string, []>("channels_mean_5_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_5_cast_fp16 = sub(x = inputs_5_cast_fp16, y = channels_mean_5_cast_fp16)[name = tensor<string, []>("zero_mean_5_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_5_cast_fp16 = mul(x = zero_mean_5_cast_fp16, y = zero_mean_5_cast_fp16)[name = tensor<string, []>("zero_mean_sq_5_cast_fp16")];
            tensor<int32, [1]> var_825 = const()[name = tensor<string, []>("op_825"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_826_cast_fp16 = reduce_mean(axes = var_825, keep_dims = var_811, x = zero_mean_sq_5_cast_fp16)[name = tensor<string, []>("op_826_cast_fp16")];
            tensor<fp16, []> var_827_to_fp16 = const()[name = tensor<string, []>("op_827_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_828_cast_fp16 = add(x = var_826_cast_fp16, y = var_827_to_fp16)[name = tensor<string, []>("op_828_cast_fp16")];
            tensor<fp16, []> denom_5_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_5_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_5_cast_fp16 = rsqrt(epsilon = denom_5_epsilon_0_to_fp16, x = var_828_cast_fp16)[name = tensor<string, []>("denom_5_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_5_cast_fp16 = mul(x = zero_mean_5_cast_fp16, y = denom_5_cast_fp16)[name = tensor<string, []>("out_5_cast_fp16")];
            tensor<fp16, [512]> obj_5_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_5_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9663936)))];
            tensor<fp16, [512]> obj_5_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_5_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9665024)))];
            tensor<fp16, []> obj_5_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_5_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> obj_5_cast_fp16 = batch_norm(beta = obj_5_beta_0_to_fp16, epsilon = obj_5_epsilon_0_to_fp16, gamma = obj_5_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_5_cast_fp16)[name = tensor<string, []>("obj_5_cast_fp16")];
            tensor<int32, [2]> var_843 = const()[name = tensor<string, []>("op_843"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_845 = const()[name = tensor<string, []>("op_845"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_3_pad_type_0 = const()[name = tensor<string, []>("query_3_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_3_pad_0 = const()[name = tensor<string, []>("query_3_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_1_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(9666112)))];
            tensor<fp16, [512]> layers_1_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(10190464)))];
            tensor<fp16, [1, 512, 1, 1500]> query_3_cast_fp16 = conv(bias = layers_1_self_attn_q_proj_bias_to_fp16, dilations = var_845, groups = var_810, pad = query_3_pad_0, pad_type = query_3_pad_type_0, strides = var_843, weight = layers_1_self_attn_q_proj_weight_to_fp16, x = obj_5_cast_fp16)[name = tensor<string, []>("query_3_cast_fp16")];
            tensor<int32, [2]> var_849 = const()[name = tensor<string, []>("op_849"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_851 = const()[name = tensor<string, []>("op_851"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_3_pad_type_0 = const()[name = tensor<string, []>("key_3_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_3_pad_0 = const()[name = tensor<string, []>("key_3_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_1_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(10191552)))];
            tensor<fp16, [1, 512, 1, 1500]> key_3_cast_fp16 = conv(dilations = var_851, groups = var_810, pad = key_3_pad_0, pad_type = key_3_pad_type_0, strides = var_849, weight = layers_1_self_attn_k_proj_weight_to_fp16, x = obj_5_cast_fp16)[name = tensor<string, []>("key_3_cast_fp16")];
            tensor<int32, [2]> var_856 = const()[name = tensor<string, []>("op_856"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_858 = const()[name = tensor<string, []>("op_858"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_3_pad_type_0 = const()[name = tensor<string, []>("value_3_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_3_pad_0 = const()[name = tensor<string, []>("value_3_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_1_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(10715904)))];
            tensor<fp16, [512]> layers_1_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11240256)))];
            tensor<fp16, [1, 512, 1, 1500]> value_3_cast_fp16 = conv(bias = layers_1_self_attn_v_proj_bias_to_fp16, dilations = var_858, groups = var_810, pad = value_3_pad_0, pad_type = value_3_pad_type_0, strides = var_856, weight = layers_1_self_attn_v_proj_weight_to_fp16, x = obj_5_cast_fp16)[name = tensor<string, []>("value_3_cast_fp16")];
            tensor<int32, [4]> var_865_begin_0 = const()[name = tensor<string, []>("op_865_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_865_end_0 = const()[name = tensor<string, []>("op_865_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_865_end_mask_0 = const()[name = tensor<string, []>("op_865_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_865_cast_fp16 = slice_by_index(begin = var_865_begin_0, end = var_865_end_0, end_mask = var_865_end_mask_0, x = query_3_cast_fp16)[name = tensor<string, []>("op_865_cast_fp16")];
            tensor<int32, [4]> var_869_begin_0 = const()[name = tensor<string, []>("op_869_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_869_end_0 = const()[name = tensor<string, []>("op_869_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_869_end_mask_0 = const()[name = tensor<string, []>("op_869_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_869_cast_fp16 = slice_by_index(begin = var_869_begin_0, end = var_869_end_0, end_mask = var_869_end_mask_0, x = query_3_cast_fp16)[name = tensor<string, []>("op_869_cast_fp16")];
            tensor<int32, [4]> var_873_begin_0 = const()[name = tensor<string, []>("op_873_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_873_end_0 = const()[name = tensor<string, []>("op_873_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_873_end_mask_0 = const()[name = tensor<string, []>("op_873_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_873_cast_fp16 = slice_by_index(begin = var_873_begin_0, end = var_873_end_0, end_mask = var_873_end_mask_0, x = query_3_cast_fp16)[name = tensor<string, []>("op_873_cast_fp16")];
            tensor<int32, [4]> var_877_begin_0 = const()[name = tensor<string, []>("op_877_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_877_end_0 = const()[name = tensor<string, []>("op_877_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_877_end_mask_0 = const()[name = tensor<string, []>("op_877_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_877_cast_fp16 = slice_by_index(begin = var_877_begin_0, end = var_877_end_0, end_mask = var_877_end_mask_0, x = query_3_cast_fp16)[name = tensor<string, []>("op_877_cast_fp16")];
            tensor<int32, [4]> var_881_begin_0 = const()[name = tensor<string, []>("op_881_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_881_end_0 = const()[name = tensor<string, []>("op_881_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_881_end_mask_0 = const()[name = tensor<string, []>("op_881_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_881_cast_fp16 = slice_by_index(begin = var_881_begin_0, end = var_881_end_0, end_mask = var_881_end_mask_0, x = query_3_cast_fp16)[name = tensor<string, []>("op_881_cast_fp16")];
            tensor<int32, [4]> var_885_begin_0 = const()[name = tensor<string, []>("op_885_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_885_end_0 = const()[name = tensor<string, []>("op_885_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_885_end_mask_0 = const()[name = tensor<string, []>("op_885_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_885_cast_fp16 = slice_by_index(begin = var_885_begin_0, end = var_885_end_0, end_mask = var_885_end_mask_0, x = query_3_cast_fp16)[name = tensor<string, []>("op_885_cast_fp16")];
            tensor<int32, [4]> var_889_begin_0 = const()[name = tensor<string, []>("op_889_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_889_end_0 = const()[name = tensor<string, []>("op_889_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_889_end_mask_0 = const()[name = tensor<string, []>("op_889_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_889_cast_fp16 = slice_by_index(begin = var_889_begin_0, end = var_889_end_0, end_mask = var_889_end_mask_0, x = query_3_cast_fp16)[name = tensor<string, []>("op_889_cast_fp16")];
            tensor<int32, [4]> var_893_begin_0 = const()[name = tensor<string, []>("op_893_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_893_end_0 = const()[name = tensor<string, []>("op_893_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_893_end_mask_0 = const()[name = tensor<string, []>("op_893_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_893_cast_fp16 = slice_by_index(begin = var_893_begin_0, end = var_893_end_0, end_mask = var_893_end_mask_0, x = query_3_cast_fp16)[name = tensor<string, []>("op_893_cast_fp16")];
            tensor<int32, [4]> var_902_begin_0 = const()[name = tensor<string, []>("op_902_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_902_end_0 = const()[name = tensor<string, []>("op_902_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_902_end_mask_0 = const()[name = tensor<string, []>("op_902_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_902_cast_fp16 = slice_by_index(begin = var_902_begin_0, end = var_902_end_0, end_mask = var_902_end_mask_0, x = var_865_cast_fp16)[name = tensor<string, []>("op_902_cast_fp16")];
            tensor<int32, [4]> var_909_begin_0 = const()[name = tensor<string, []>("op_909_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_909_end_0 = const()[name = tensor<string, []>("op_909_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_909_end_mask_0 = const()[name = tensor<string, []>("op_909_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_909_cast_fp16 = slice_by_index(begin = var_909_begin_0, end = var_909_end_0, end_mask = var_909_end_mask_0, x = var_865_cast_fp16)[name = tensor<string, []>("op_909_cast_fp16")];
            tensor<int32, [4]> var_916_begin_0 = const()[name = tensor<string, []>("op_916_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_916_end_0 = const()[name = tensor<string, []>("op_916_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_916_end_mask_0 = const()[name = tensor<string, []>("op_916_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_916_cast_fp16 = slice_by_index(begin = var_916_begin_0, end = var_916_end_0, end_mask = var_916_end_mask_0, x = var_865_cast_fp16)[name = tensor<string, []>("op_916_cast_fp16")];
            tensor<int32, [4]> var_923_begin_0 = const()[name = tensor<string, []>("op_923_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_923_end_0 = const()[name = tensor<string, []>("op_923_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_923_end_mask_0 = const()[name = tensor<string, []>("op_923_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_923_cast_fp16 = slice_by_index(begin = var_923_begin_0, end = var_923_end_0, end_mask = var_923_end_mask_0, x = var_865_cast_fp16)[name = tensor<string, []>("op_923_cast_fp16")];
            tensor<int32, [4]> var_930_begin_0 = const()[name = tensor<string, []>("op_930_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_930_end_0 = const()[name = tensor<string, []>("op_930_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_930_end_mask_0 = const()[name = tensor<string, []>("op_930_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_930_cast_fp16 = slice_by_index(begin = var_930_begin_0, end = var_930_end_0, end_mask = var_930_end_mask_0, x = var_869_cast_fp16)[name = tensor<string, []>("op_930_cast_fp16")];
            tensor<int32, [4]> var_937_begin_0 = const()[name = tensor<string, []>("op_937_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_937_end_0 = const()[name = tensor<string, []>("op_937_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_937_end_mask_0 = const()[name = tensor<string, []>("op_937_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_937_cast_fp16 = slice_by_index(begin = var_937_begin_0, end = var_937_end_0, end_mask = var_937_end_mask_0, x = var_869_cast_fp16)[name = tensor<string, []>("op_937_cast_fp16")];
            tensor<int32, [4]> var_944_begin_0 = const()[name = tensor<string, []>("op_944_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_944_end_0 = const()[name = tensor<string, []>("op_944_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_944_end_mask_0 = const()[name = tensor<string, []>("op_944_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_944_cast_fp16 = slice_by_index(begin = var_944_begin_0, end = var_944_end_0, end_mask = var_944_end_mask_0, x = var_869_cast_fp16)[name = tensor<string, []>("op_944_cast_fp16")];
            tensor<int32, [4]> var_951_begin_0 = const()[name = tensor<string, []>("op_951_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_951_end_0 = const()[name = tensor<string, []>("op_951_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_951_end_mask_0 = const()[name = tensor<string, []>("op_951_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_951_cast_fp16 = slice_by_index(begin = var_951_begin_0, end = var_951_end_0, end_mask = var_951_end_mask_0, x = var_869_cast_fp16)[name = tensor<string, []>("op_951_cast_fp16")];
            tensor<int32, [4]> var_958_begin_0 = const()[name = tensor<string, []>("op_958_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_958_end_0 = const()[name = tensor<string, []>("op_958_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_958_end_mask_0 = const()[name = tensor<string, []>("op_958_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_958_cast_fp16 = slice_by_index(begin = var_958_begin_0, end = var_958_end_0, end_mask = var_958_end_mask_0, x = var_873_cast_fp16)[name = tensor<string, []>("op_958_cast_fp16")];
            tensor<int32, [4]> var_965_begin_0 = const()[name = tensor<string, []>("op_965_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_965_end_0 = const()[name = tensor<string, []>("op_965_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_965_end_mask_0 = const()[name = tensor<string, []>("op_965_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_965_cast_fp16 = slice_by_index(begin = var_965_begin_0, end = var_965_end_0, end_mask = var_965_end_mask_0, x = var_873_cast_fp16)[name = tensor<string, []>("op_965_cast_fp16")];
            tensor<int32, [4]> var_972_begin_0 = const()[name = tensor<string, []>("op_972_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_972_end_0 = const()[name = tensor<string, []>("op_972_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_972_end_mask_0 = const()[name = tensor<string, []>("op_972_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_972_cast_fp16 = slice_by_index(begin = var_972_begin_0, end = var_972_end_0, end_mask = var_972_end_mask_0, x = var_873_cast_fp16)[name = tensor<string, []>("op_972_cast_fp16")];
            tensor<int32, [4]> var_979_begin_0 = const()[name = tensor<string, []>("op_979_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_979_end_0 = const()[name = tensor<string, []>("op_979_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_979_end_mask_0 = const()[name = tensor<string, []>("op_979_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_979_cast_fp16 = slice_by_index(begin = var_979_begin_0, end = var_979_end_0, end_mask = var_979_end_mask_0, x = var_873_cast_fp16)[name = tensor<string, []>("op_979_cast_fp16")];
            tensor<int32, [4]> var_986_begin_0 = const()[name = tensor<string, []>("op_986_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_986_end_0 = const()[name = tensor<string, []>("op_986_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_986_end_mask_0 = const()[name = tensor<string, []>("op_986_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_986_cast_fp16 = slice_by_index(begin = var_986_begin_0, end = var_986_end_0, end_mask = var_986_end_mask_0, x = var_877_cast_fp16)[name = tensor<string, []>("op_986_cast_fp16")];
            tensor<int32, [4]> var_993_begin_0 = const()[name = tensor<string, []>("op_993_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_993_end_0 = const()[name = tensor<string, []>("op_993_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_993_end_mask_0 = const()[name = tensor<string, []>("op_993_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_993_cast_fp16 = slice_by_index(begin = var_993_begin_0, end = var_993_end_0, end_mask = var_993_end_mask_0, x = var_877_cast_fp16)[name = tensor<string, []>("op_993_cast_fp16")];
            tensor<int32, [4]> var_1000_begin_0 = const()[name = tensor<string, []>("op_1000_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1000_end_0 = const()[name = tensor<string, []>("op_1000_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1000_end_mask_0 = const()[name = tensor<string, []>("op_1000_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1000_cast_fp16 = slice_by_index(begin = var_1000_begin_0, end = var_1000_end_0, end_mask = var_1000_end_mask_0, x = var_877_cast_fp16)[name = tensor<string, []>("op_1000_cast_fp16")];
            tensor<int32, [4]> var_1007_begin_0 = const()[name = tensor<string, []>("op_1007_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1007_end_0 = const()[name = tensor<string, []>("op_1007_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1007_end_mask_0 = const()[name = tensor<string, []>("op_1007_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1007_cast_fp16 = slice_by_index(begin = var_1007_begin_0, end = var_1007_end_0, end_mask = var_1007_end_mask_0, x = var_877_cast_fp16)[name = tensor<string, []>("op_1007_cast_fp16")];
            tensor<int32, [4]> var_1014_begin_0 = const()[name = tensor<string, []>("op_1014_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1014_end_0 = const()[name = tensor<string, []>("op_1014_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1014_end_mask_0 = const()[name = tensor<string, []>("op_1014_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1014_cast_fp16 = slice_by_index(begin = var_1014_begin_0, end = var_1014_end_0, end_mask = var_1014_end_mask_0, x = var_881_cast_fp16)[name = tensor<string, []>("op_1014_cast_fp16")];
            tensor<int32, [4]> var_1021_begin_0 = const()[name = tensor<string, []>("op_1021_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1021_end_0 = const()[name = tensor<string, []>("op_1021_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1021_end_mask_0 = const()[name = tensor<string, []>("op_1021_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1021_cast_fp16 = slice_by_index(begin = var_1021_begin_0, end = var_1021_end_0, end_mask = var_1021_end_mask_0, x = var_881_cast_fp16)[name = tensor<string, []>("op_1021_cast_fp16")];
            tensor<int32, [4]> var_1028_begin_0 = const()[name = tensor<string, []>("op_1028_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1028_end_0 = const()[name = tensor<string, []>("op_1028_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1028_end_mask_0 = const()[name = tensor<string, []>("op_1028_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1028_cast_fp16 = slice_by_index(begin = var_1028_begin_0, end = var_1028_end_0, end_mask = var_1028_end_mask_0, x = var_881_cast_fp16)[name = tensor<string, []>("op_1028_cast_fp16")];
            tensor<int32, [4]> var_1035_begin_0 = const()[name = tensor<string, []>("op_1035_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1035_end_0 = const()[name = tensor<string, []>("op_1035_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1035_end_mask_0 = const()[name = tensor<string, []>("op_1035_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1035_cast_fp16 = slice_by_index(begin = var_1035_begin_0, end = var_1035_end_0, end_mask = var_1035_end_mask_0, x = var_881_cast_fp16)[name = tensor<string, []>("op_1035_cast_fp16")];
            tensor<int32, [4]> var_1042_begin_0 = const()[name = tensor<string, []>("op_1042_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1042_end_0 = const()[name = tensor<string, []>("op_1042_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1042_end_mask_0 = const()[name = tensor<string, []>("op_1042_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1042_cast_fp16 = slice_by_index(begin = var_1042_begin_0, end = var_1042_end_0, end_mask = var_1042_end_mask_0, x = var_885_cast_fp16)[name = tensor<string, []>("op_1042_cast_fp16")];
            tensor<int32, [4]> var_1049_begin_0 = const()[name = tensor<string, []>("op_1049_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1049_end_0 = const()[name = tensor<string, []>("op_1049_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1049_end_mask_0 = const()[name = tensor<string, []>("op_1049_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1049_cast_fp16 = slice_by_index(begin = var_1049_begin_0, end = var_1049_end_0, end_mask = var_1049_end_mask_0, x = var_885_cast_fp16)[name = tensor<string, []>("op_1049_cast_fp16")];
            tensor<int32, [4]> var_1056_begin_0 = const()[name = tensor<string, []>("op_1056_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1056_end_0 = const()[name = tensor<string, []>("op_1056_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1056_end_mask_0 = const()[name = tensor<string, []>("op_1056_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1056_cast_fp16 = slice_by_index(begin = var_1056_begin_0, end = var_1056_end_0, end_mask = var_1056_end_mask_0, x = var_885_cast_fp16)[name = tensor<string, []>("op_1056_cast_fp16")];
            tensor<int32, [4]> var_1063_begin_0 = const()[name = tensor<string, []>("op_1063_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1063_end_0 = const()[name = tensor<string, []>("op_1063_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1063_end_mask_0 = const()[name = tensor<string, []>("op_1063_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1063_cast_fp16 = slice_by_index(begin = var_1063_begin_0, end = var_1063_end_0, end_mask = var_1063_end_mask_0, x = var_885_cast_fp16)[name = tensor<string, []>("op_1063_cast_fp16")];
            tensor<int32, [4]> var_1070_begin_0 = const()[name = tensor<string, []>("op_1070_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1070_end_0 = const()[name = tensor<string, []>("op_1070_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1070_end_mask_0 = const()[name = tensor<string, []>("op_1070_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1070_cast_fp16 = slice_by_index(begin = var_1070_begin_0, end = var_1070_end_0, end_mask = var_1070_end_mask_0, x = var_889_cast_fp16)[name = tensor<string, []>("op_1070_cast_fp16")];
            tensor<int32, [4]> var_1077_begin_0 = const()[name = tensor<string, []>("op_1077_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1077_end_0 = const()[name = tensor<string, []>("op_1077_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1077_end_mask_0 = const()[name = tensor<string, []>("op_1077_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1077_cast_fp16 = slice_by_index(begin = var_1077_begin_0, end = var_1077_end_0, end_mask = var_1077_end_mask_0, x = var_889_cast_fp16)[name = tensor<string, []>("op_1077_cast_fp16")];
            tensor<int32, [4]> var_1084_begin_0 = const()[name = tensor<string, []>("op_1084_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1084_end_0 = const()[name = tensor<string, []>("op_1084_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1084_end_mask_0 = const()[name = tensor<string, []>("op_1084_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1084_cast_fp16 = slice_by_index(begin = var_1084_begin_0, end = var_1084_end_0, end_mask = var_1084_end_mask_0, x = var_889_cast_fp16)[name = tensor<string, []>("op_1084_cast_fp16")];
            tensor<int32, [4]> var_1091_begin_0 = const()[name = tensor<string, []>("op_1091_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1091_end_0 = const()[name = tensor<string, []>("op_1091_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1091_end_mask_0 = const()[name = tensor<string, []>("op_1091_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1091_cast_fp16 = slice_by_index(begin = var_1091_begin_0, end = var_1091_end_0, end_mask = var_1091_end_mask_0, x = var_889_cast_fp16)[name = tensor<string, []>("op_1091_cast_fp16")];
            tensor<int32, [4]> var_1098_begin_0 = const()[name = tensor<string, []>("op_1098_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1098_end_0 = const()[name = tensor<string, []>("op_1098_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1098_end_mask_0 = const()[name = tensor<string, []>("op_1098_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1098_cast_fp16 = slice_by_index(begin = var_1098_begin_0, end = var_1098_end_0, end_mask = var_1098_end_mask_0, x = var_893_cast_fp16)[name = tensor<string, []>("op_1098_cast_fp16")];
            tensor<int32, [4]> var_1105_begin_0 = const()[name = tensor<string, []>("op_1105_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1105_end_0 = const()[name = tensor<string, []>("op_1105_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1105_end_mask_0 = const()[name = tensor<string, []>("op_1105_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1105_cast_fp16 = slice_by_index(begin = var_1105_begin_0, end = var_1105_end_0, end_mask = var_1105_end_mask_0, x = var_893_cast_fp16)[name = tensor<string, []>("op_1105_cast_fp16")];
            tensor<int32, [4]> var_1112_begin_0 = const()[name = tensor<string, []>("op_1112_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1112_end_0 = const()[name = tensor<string, []>("op_1112_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1112_end_mask_0 = const()[name = tensor<string, []>("op_1112_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1112_cast_fp16 = slice_by_index(begin = var_1112_begin_0, end = var_1112_end_0, end_mask = var_1112_end_mask_0, x = var_893_cast_fp16)[name = tensor<string, []>("op_1112_cast_fp16")];
            tensor<int32, [4]> var_1119_begin_0 = const()[name = tensor<string, []>("op_1119_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1119_end_0 = const()[name = tensor<string, []>("op_1119_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1119_end_mask_0 = const()[name = tensor<string, []>("op_1119_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1119_cast_fp16 = slice_by_index(begin = var_1119_begin_0, end = var_1119_end_0, end_mask = var_1119_end_mask_0, x = var_893_cast_fp16)[name = tensor<string, []>("op_1119_cast_fp16")];
            tensor<int32, [4]> k_3_perm_0 = const()[name = tensor<string, []>("k_3_perm_0"), val = tensor<int32, [4]>([0, 3, 2, 1])];
            tensor<int32, [4]> var_1124_begin_0 = const()[name = tensor<string, []>("op_1124_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1124_end_0 = const()[name = tensor<string, []>("op_1124_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 64])];
            tensor<bool, [4]> var_1124_end_mask_0 = const()[name = tensor<string, []>("op_1124_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 512]> transpose_4 = transpose(perm = k_3_perm_0, x = key_3_cast_fp16)[name = tensor<string, []>("transpose_4")];
            tensor<fp16, [1, 1500, 1, 64]> var_1124_cast_fp16 = slice_by_index(begin = var_1124_begin_0, end = var_1124_end_0, end_mask = var_1124_end_mask_0, x = transpose_4)[name = tensor<string, []>("op_1124_cast_fp16")];
            tensor<int32, [4]> var_1128_begin_0 = const()[name = tensor<string, []>("op_1128_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 64])];
            tensor<int32, [4]> var_1128_end_0 = const()[name = tensor<string, []>("op_1128_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 128])];
            tensor<bool, [4]> var_1128_end_mask_0 = const()[name = tensor<string, []>("op_1128_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1128_cast_fp16 = slice_by_index(begin = var_1128_begin_0, end = var_1128_end_0, end_mask = var_1128_end_mask_0, x = transpose_4)[name = tensor<string, []>("op_1128_cast_fp16")];
            tensor<int32, [4]> var_1132_begin_0 = const()[name = tensor<string, []>("op_1132_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 128])];
            tensor<int32, [4]> var_1132_end_0 = const()[name = tensor<string, []>("op_1132_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 192])];
            tensor<bool, [4]> var_1132_end_mask_0 = const()[name = tensor<string, []>("op_1132_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1132_cast_fp16 = slice_by_index(begin = var_1132_begin_0, end = var_1132_end_0, end_mask = var_1132_end_mask_0, x = transpose_4)[name = tensor<string, []>("op_1132_cast_fp16")];
            tensor<int32, [4]> var_1136_begin_0 = const()[name = tensor<string, []>("op_1136_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 192])];
            tensor<int32, [4]> var_1136_end_0 = const()[name = tensor<string, []>("op_1136_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 256])];
            tensor<bool, [4]> var_1136_end_mask_0 = const()[name = tensor<string, []>("op_1136_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1136_cast_fp16 = slice_by_index(begin = var_1136_begin_0, end = var_1136_end_0, end_mask = var_1136_end_mask_0, x = transpose_4)[name = tensor<string, []>("op_1136_cast_fp16")];
            tensor<int32, [4]> var_1140_begin_0 = const()[name = tensor<string, []>("op_1140_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 256])];
            tensor<int32, [4]> var_1140_end_0 = const()[name = tensor<string, []>("op_1140_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 320])];
            tensor<bool, [4]> var_1140_end_mask_0 = const()[name = tensor<string, []>("op_1140_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1140_cast_fp16 = slice_by_index(begin = var_1140_begin_0, end = var_1140_end_0, end_mask = var_1140_end_mask_0, x = transpose_4)[name = tensor<string, []>("op_1140_cast_fp16")];
            tensor<int32, [4]> var_1144_begin_0 = const()[name = tensor<string, []>("op_1144_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 320])];
            tensor<int32, [4]> var_1144_end_0 = const()[name = tensor<string, []>("op_1144_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 384])];
            tensor<bool, [4]> var_1144_end_mask_0 = const()[name = tensor<string, []>("op_1144_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1144_cast_fp16 = slice_by_index(begin = var_1144_begin_0, end = var_1144_end_0, end_mask = var_1144_end_mask_0, x = transpose_4)[name = tensor<string, []>("op_1144_cast_fp16")];
            tensor<int32, [4]> var_1148_begin_0 = const()[name = tensor<string, []>("op_1148_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 384])];
            tensor<int32, [4]> var_1148_end_0 = const()[name = tensor<string, []>("op_1148_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 448])];
            tensor<bool, [4]> var_1148_end_mask_0 = const()[name = tensor<string, []>("op_1148_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1148_cast_fp16 = slice_by_index(begin = var_1148_begin_0, end = var_1148_end_0, end_mask = var_1148_end_mask_0, x = transpose_4)[name = tensor<string, []>("op_1148_cast_fp16")];
            tensor<int32, [4]> var_1152_begin_0 = const()[name = tensor<string, []>("op_1152_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 448])];
            tensor<int32, [4]> var_1152_end_0 = const()[name = tensor<string, []>("op_1152_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 512])];
            tensor<bool, [4]> var_1152_end_mask_0 = const()[name = tensor<string, []>("op_1152_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1152_cast_fp16 = slice_by_index(begin = var_1152_begin_0, end = var_1152_end_0, end_mask = var_1152_end_mask_0, x = transpose_4)[name = tensor<string, []>("op_1152_cast_fp16")];
            tensor<int32, [4]> var_1154_begin_0 = const()[name = tensor<string, []>("op_1154_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1154_end_0 = const()[name = tensor<string, []>("op_1154_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1154_end_mask_0 = const()[name = tensor<string, []>("op_1154_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1154_cast_fp16 = slice_by_index(begin = var_1154_begin_0, end = var_1154_end_0, end_mask = var_1154_end_mask_0, x = value_3_cast_fp16)[name = tensor<string, []>("op_1154_cast_fp16")];
            tensor<int32, [4]> var_1158_begin_0 = const()[name = tensor<string, []>("op_1158_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_1158_end_0 = const()[name = tensor<string, []>("op_1158_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_1158_end_mask_0 = const()[name = tensor<string, []>("op_1158_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1158_cast_fp16 = slice_by_index(begin = var_1158_begin_0, end = var_1158_end_0, end_mask = var_1158_end_mask_0, x = value_3_cast_fp16)[name = tensor<string, []>("op_1158_cast_fp16")];
            tensor<int32, [4]> var_1162_begin_0 = const()[name = tensor<string, []>("op_1162_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_1162_end_0 = const()[name = tensor<string, []>("op_1162_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_1162_end_mask_0 = const()[name = tensor<string, []>("op_1162_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1162_cast_fp16 = slice_by_index(begin = var_1162_begin_0, end = var_1162_end_0, end_mask = var_1162_end_mask_0, x = value_3_cast_fp16)[name = tensor<string, []>("op_1162_cast_fp16")];
            tensor<int32, [4]> var_1166_begin_0 = const()[name = tensor<string, []>("op_1166_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_1166_end_0 = const()[name = tensor<string, []>("op_1166_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_1166_end_mask_0 = const()[name = tensor<string, []>("op_1166_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1166_cast_fp16 = slice_by_index(begin = var_1166_begin_0, end = var_1166_end_0, end_mask = var_1166_end_mask_0, x = value_3_cast_fp16)[name = tensor<string, []>("op_1166_cast_fp16")];
            tensor<int32, [4]> var_1170_begin_0 = const()[name = tensor<string, []>("op_1170_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_1170_end_0 = const()[name = tensor<string, []>("op_1170_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_1170_end_mask_0 = const()[name = tensor<string, []>("op_1170_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1170_cast_fp16 = slice_by_index(begin = var_1170_begin_0, end = var_1170_end_0, end_mask = var_1170_end_mask_0, x = value_3_cast_fp16)[name = tensor<string, []>("op_1170_cast_fp16")];
            tensor<int32, [4]> var_1174_begin_0 = const()[name = tensor<string, []>("op_1174_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_1174_end_0 = const()[name = tensor<string, []>("op_1174_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_1174_end_mask_0 = const()[name = tensor<string, []>("op_1174_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1174_cast_fp16 = slice_by_index(begin = var_1174_begin_0, end = var_1174_end_0, end_mask = var_1174_end_mask_0, x = value_3_cast_fp16)[name = tensor<string, []>("op_1174_cast_fp16")];
            tensor<int32, [4]> var_1178_begin_0 = const()[name = tensor<string, []>("op_1178_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_1178_end_0 = const()[name = tensor<string, []>("op_1178_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_1178_end_mask_0 = const()[name = tensor<string, []>("op_1178_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1178_cast_fp16 = slice_by_index(begin = var_1178_begin_0, end = var_1178_end_0, end_mask = var_1178_end_mask_0, x = value_3_cast_fp16)[name = tensor<string, []>("op_1178_cast_fp16")];
            tensor<int32, [4]> var_1182_begin_0 = const()[name = tensor<string, []>("op_1182_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_1182_end_0 = const()[name = tensor<string, []>("op_1182_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_1182_end_mask_0 = const()[name = tensor<string, []>("op_1182_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1182_cast_fp16 = slice_by_index(begin = var_1182_begin_0, end = var_1182_end_0, end_mask = var_1182_end_mask_0, x = value_3_cast_fp16)[name = tensor<string, []>("op_1182_cast_fp16")];
            tensor<string, []> var_1186_equation_0 = const()[name = tensor<string, []>("op_1186_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1186_cast_fp16 = einsum(equation = var_1186_equation_0, values = (var_1124_cast_fp16, var_902_cast_fp16))[name = tensor<string, []>("op_1186_cast_fp16")];
            tensor<fp16, []> var_1187_to_fp16 = const()[name = tensor<string, []>("op_1187_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_65_cast_fp16 = mul(x = var_1186_cast_fp16, y = var_1187_to_fp16)[name = tensor<string, []>("aw_chunk_65_cast_fp16")];
            tensor<string, []> var_1190_equation_0 = const()[name = tensor<string, []>("op_1190_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1190_cast_fp16 = einsum(equation = var_1190_equation_0, values = (var_1124_cast_fp16, var_909_cast_fp16))[name = tensor<string, []>("op_1190_cast_fp16")];
            tensor<fp16, []> var_1191_to_fp16 = const()[name = tensor<string, []>("op_1191_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_67_cast_fp16 = mul(x = var_1190_cast_fp16, y = var_1191_to_fp16)[name = tensor<string, []>("aw_chunk_67_cast_fp16")];
            tensor<string, []> var_1194_equation_0 = const()[name = tensor<string, []>("op_1194_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1194_cast_fp16 = einsum(equation = var_1194_equation_0, values = (var_1124_cast_fp16, var_916_cast_fp16))[name = tensor<string, []>("op_1194_cast_fp16")];
            tensor<fp16, []> var_1195_to_fp16 = const()[name = tensor<string, []>("op_1195_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_69_cast_fp16 = mul(x = var_1194_cast_fp16, y = var_1195_to_fp16)[name = tensor<string, []>("aw_chunk_69_cast_fp16")];
            tensor<string, []> var_1198_equation_0 = const()[name = tensor<string, []>("op_1198_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1198_cast_fp16 = einsum(equation = var_1198_equation_0, values = (var_1124_cast_fp16, var_923_cast_fp16))[name = tensor<string, []>("op_1198_cast_fp16")];
            tensor<fp16, []> var_1199_to_fp16 = const()[name = tensor<string, []>("op_1199_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_71_cast_fp16 = mul(x = var_1198_cast_fp16, y = var_1199_to_fp16)[name = tensor<string, []>("aw_chunk_71_cast_fp16")];
            tensor<string, []> var_1202_equation_0 = const()[name = tensor<string, []>("op_1202_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1202_cast_fp16 = einsum(equation = var_1202_equation_0, values = (var_1128_cast_fp16, var_930_cast_fp16))[name = tensor<string, []>("op_1202_cast_fp16")];
            tensor<fp16, []> var_1203_to_fp16 = const()[name = tensor<string, []>("op_1203_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_73_cast_fp16 = mul(x = var_1202_cast_fp16, y = var_1203_to_fp16)[name = tensor<string, []>("aw_chunk_73_cast_fp16")];
            tensor<string, []> var_1206_equation_0 = const()[name = tensor<string, []>("op_1206_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1206_cast_fp16 = einsum(equation = var_1206_equation_0, values = (var_1128_cast_fp16, var_937_cast_fp16))[name = tensor<string, []>("op_1206_cast_fp16")];
            tensor<fp16, []> var_1207_to_fp16 = const()[name = tensor<string, []>("op_1207_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_75_cast_fp16 = mul(x = var_1206_cast_fp16, y = var_1207_to_fp16)[name = tensor<string, []>("aw_chunk_75_cast_fp16")];
            tensor<string, []> var_1210_equation_0 = const()[name = tensor<string, []>("op_1210_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1210_cast_fp16 = einsum(equation = var_1210_equation_0, values = (var_1128_cast_fp16, var_944_cast_fp16))[name = tensor<string, []>("op_1210_cast_fp16")];
            tensor<fp16, []> var_1211_to_fp16 = const()[name = tensor<string, []>("op_1211_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_77_cast_fp16 = mul(x = var_1210_cast_fp16, y = var_1211_to_fp16)[name = tensor<string, []>("aw_chunk_77_cast_fp16")];
            tensor<string, []> var_1214_equation_0 = const()[name = tensor<string, []>("op_1214_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1214_cast_fp16 = einsum(equation = var_1214_equation_0, values = (var_1128_cast_fp16, var_951_cast_fp16))[name = tensor<string, []>("op_1214_cast_fp16")];
            tensor<fp16, []> var_1215_to_fp16 = const()[name = tensor<string, []>("op_1215_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_79_cast_fp16 = mul(x = var_1214_cast_fp16, y = var_1215_to_fp16)[name = tensor<string, []>("aw_chunk_79_cast_fp16")];
            tensor<string, []> var_1218_equation_0 = const()[name = tensor<string, []>("op_1218_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1218_cast_fp16 = einsum(equation = var_1218_equation_0, values = (var_1132_cast_fp16, var_958_cast_fp16))[name = tensor<string, []>("op_1218_cast_fp16")];
            tensor<fp16, []> var_1219_to_fp16 = const()[name = tensor<string, []>("op_1219_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_81_cast_fp16 = mul(x = var_1218_cast_fp16, y = var_1219_to_fp16)[name = tensor<string, []>("aw_chunk_81_cast_fp16")];
            tensor<string, []> var_1222_equation_0 = const()[name = tensor<string, []>("op_1222_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1222_cast_fp16 = einsum(equation = var_1222_equation_0, values = (var_1132_cast_fp16, var_965_cast_fp16))[name = tensor<string, []>("op_1222_cast_fp16")];
            tensor<fp16, []> var_1223_to_fp16 = const()[name = tensor<string, []>("op_1223_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_83_cast_fp16 = mul(x = var_1222_cast_fp16, y = var_1223_to_fp16)[name = tensor<string, []>("aw_chunk_83_cast_fp16")];
            tensor<string, []> var_1226_equation_0 = const()[name = tensor<string, []>("op_1226_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1226_cast_fp16 = einsum(equation = var_1226_equation_0, values = (var_1132_cast_fp16, var_972_cast_fp16))[name = tensor<string, []>("op_1226_cast_fp16")];
            tensor<fp16, []> var_1227_to_fp16 = const()[name = tensor<string, []>("op_1227_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_85_cast_fp16 = mul(x = var_1226_cast_fp16, y = var_1227_to_fp16)[name = tensor<string, []>("aw_chunk_85_cast_fp16")];
            tensor<string, []> var_1230_equation_0 = const()[name = tensor<string, []>("op_1230_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1230_cast_fp16 = einsum(equation = var_1230_equation_0, values = (var_1132_cast_fp16, var_979_cast_fp16))[name = tensor<string, []>("op_1230_cast_fp16")];
            tensor<fp16, []> var_1231_to_fp16 = const()[name = tensor<string, []>("op_1231_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_87_cast_fp16 = mul(x = var_1230_cast_fp16, y = var_1231_to_fp16)[name = tensor<string, []>("aw_chunk_87_cast_fp16")];
            tensor<string, []> var_1234_equation_0 = const()[name = tensor<string, []>("op_1234_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1234_cast_fp16 = einsum(equation = var_1234_equation_0, values = (var_1136_cast_fp16, var_986_cast_fp16))[name = tensor<string, []>("op_1234_cast_fp16")];
            tensor<fp16, []> var_1235_to_fp16 = const()[name = tensor<string, []>("op_1235_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_89_cast_fp16 = mul(x = var_1234_cast_fp16, y = var_1235_to_fp16)[name = tensor<string, []>("aw_chunk_89_cast_fp16")];
            tensor<string, []> var_1238_equation_0 = const()[name = tensor<string, []>("op_1238_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1238_cast_fp16 = einsum(equation = var_1238_equation_0, values = (var_1136_cast_fp16, var_993_cast_fp16))[name = tensor<string, []>("op_1238_cast_fp16")];
            tensor<fp16, []> var_1239_to_fp16 = const()[name = tensor<string, []>("op_1239_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_91_cast_fp16 = mul(x = var_1238_cast_fp16, y = var_1239_to_fp16)[name = tensor<string, []>("aw_chunk_91_cast_fp16")];
            tensor<string, []> var_1242_equation_0 = const()[name = tensor<string, []>("op_1242_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1242_cast_fp16 = einsum(equation = var_1242_equation_0, values = (var_1136_cast_fp16, var_1000_cast_fp16))[name = tensor<string, []>("op_1242_cast_fp16")];
            tensor<fp16, []> var_1243_to_fp16 = const()[name = tensor<string, []>("op_1243_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_93_cast_fp16 = mul(x = var_1242_cast_fp16, y = var_1243_to_fp16)[name = tensor<string, []>("aw_chunk_93_cast_fp16")];
            tensor<string, []> var_1246_equation_0 = const()[name = tensor<string, []>("op_1246_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1246_cast_fp16 = einsum(equation = var_1246_equation_0, values = (var_1136_cast_fp16, var_1007_cast_fp16))[name = tensor<string, []>("op_1246_cast_fp16")];
            tensor<fp16, []> var_1247_to_fp16 = const()[name = tensor<string, []>("op_1247_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_95_cast_fp16 = mul(x = var_1246_cast_fp16, y = var_1247_to_fp16)[name = tensor<string, []>("aw_chunk_95_cast_fp16")];
            tensor<string, []> var_1250_equation_0 = const()[name = tensor<string, []>("op_1250_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1250_cast_fp16 = einsum(equation = var_1250_equation_0, values = (var_1140_cast_fp16, var_1014_cast_fp16))[name = tensor<string, []>("op_1250_cast_fp16")];
            tensor<fp16, []> var_1251_to_fp16 = const()[name = tensor<string, []>("op_1251_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_97_cast_fp16 = mul(x = var_1250_cast_fp16, y = var_1251_to_fp16)[name = tensor<string, []>("aw_chunk_97_cast_fp16")];
            tensor<string, []> var_1254_equation_0 = const()[name = tensor<string, []>("op_1254_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1254_cast_fp16 = einsum(equation = var_1254_equation_0, values = (var_1140_cast_fp16, var_1021_cast_fp16))[name = tensor<string, []>("op_1254_cast_fp16")];
            tensor<fp16, []> var_1255_to_fp16 = const()[name = tensor<string, []>("op_1255_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_99_cast_fp16 = mul(x = var_1254_cast_fp16, y = var_1255_to_fp16)[name = tensor<string, []>("aw_chunk_99_cast_fp16")];
            tensor<string, []> var_1258_equation_0 = const()[name = tensor<string, []>("op_1258_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1258_cast_fp16 = einsum(equation = var_1258_equation_0, values = (var_1140_cast_fp16, var_1028_cast_fp16))[name = tensor<string, []>("op_1258_cast_fp16")];
            tensor<fp16, []> var_1259_to_fp16 = const()[name = tensor<string, []>("op_1259_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_101_cast_fp16 = mul(x = var_1258_cast_fp16, y = var_1259_to_fp16)[name = tensor<string, []>("aw_chunk_101_cast_fp16")];
            tensor<string, []> var_1262_equation_0 = const()[name = tensor<string, []>("op_1262_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1262_cast_fp16 = einsum(equation = var_1262_equation_0, values = (var_1140_cast_fp16, var_1035_cast_fp16))[name = tensor<string, []>("op_1262_cast_fp16")];
            tensor<fp16, []> var_1263_to_fp16 = const()[name = tensor<string, []>("op_1263_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_103_cast_fp16 = mul(x = var_1262_cast_fp16, y = var_1263_to_fp16)[name = tensor<string, []>("aw_chunk_103_cast_fp16")];
            tensor<string, []> var_1266_equation_0 = const()[name = tensor<string, []>("op_1266_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1266_cast_fp16 = einsum(equation = var_1266_equation_0, values = (var_1144_cast_fp16, var_1042_cast_fp16))[name = tensor<string, []>("op_1266_cast_fp16")];
            tensor<fp16, []> var_1267_to_fp16 = const()[name = tensor<string, []>("op_1267_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_105_cast_fp16 = mul(x = var_1266_cast_fp16, y = var_1267_to_fp16)[name = tensor<string, []>("aw_chunk_105_cast_fp16")];
            tensor<string, []> var_1270_equation_0 = const()[name = tensor<string, []>("op_1270_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1270_cast_fp16 = einsum(equation = var_1270_equation_0, values = (var_1144_cast_fp16, var_1049_cast_fp16))[name = tensor<string, []>("op_1270_cast_fp16")];
            tensor<fp16, []> var_1271_to_fp16 = const()[name = tensor<string, []>("op_1271_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_107_cast_fp16 = mul(x = var_1270_cast_fp16, y = var_1271_to_fp16)[name = tensor<string, []>("aw_chunk_107_cast_fp16")];
            tensor<string, []> var_1274_equation_0 = const()[name = tensor<string, []>("op_1274_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1274_cast_fp16 = einsum(equation = var_1274_equation_0, values = (var_1144_cast_fp16, var_1056_cast_fp16))[name = tensor<string, []>("op_1274_cast_fp16")];
            tensor<fp16, []> var_1275_to_fp16 = const()[name = tensor<string, []>("op_1275_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_109_cast_fp16 = mul(x = var_1274_cast_fp16, y = var_1275_to_fp16)[name = tensor<string, []>("aw_chunk_109_cast_fp16")];
            tensor<string, []> var_1278_equation_0 = const()[name = tensor<string, []>("op_1278_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1278_cast_fp16 = einsum(equation = var_1278_equation_0, values = (var_1144_cast_fp16, var_1063_cast_fp16))[name = tensor<string, []>("op_1278_cast_fp16")];
            tensor<fp16, []> var_1279_to_fp16 = const()[name = tensor<string, []>("op_1279_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_111_cast_fp16 = mul(x = var_1278_cast_fp16, y = var_1279_to_fp16)[name = tensor<string, []>("aw_chunk_111_cast_fp16")];
            tensor<string, []> var_1282_equation_0 = const()[name = tensor<string, []>("op_1282_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1282_cast_fp16 = einsum(equation = var_1282_equation_0, values = (var_1148_cast_fp16, var_1070_cast_fp16))[name = tensor<string, []>("op_1282_cast_fp16")];
            tensor<fp16, []> var_1283_to_fp16 = const()[name = tensor<string, []>("op_1283_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_113_cast_fp16 = mul(x = var_1282_cast_fp16, y = var_1283_to_fp16)[name = tensor<string, []>("aw_chunk_113_cast_fp16")];
            tensor<string, []> var_1286_equation_0 = const()[name = tensor<string, []>("op_1286_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1286_cast_fp16 = einsum(equation = var_1286_equation_0, values = (var_1148_cast_fp16, var_1077_cast_fp16))[name = tensor<string, []>("op_1286_cast_fp16")];
            tensor<fp16, []> var_1287_to_fp16 = const()[name = tensor<string, []>("op_1287_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_115_cast_fp16 = mul(x = var_1286_cast_fp16, y = var_1287_to_fp16)[name = tensor<string, []>("aw_chunk_115_cast_fp16")];
            tensor<string, []> var_1290_equation_0 = const()[name = tensor<string, []>("op_1290_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1290_cast_fp16 = einsum(equation = var_1290_equation_0, values = (var_1148_cast_fp16, var_1084_cast_fp16))[name = tensor<string, []>("op_1290_cast_fp16")];
            tensor<fp16, []> var_1291_to_fp16 = const()[name = tensor<string, []>("op_1291_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_117_cast_fp16 = mul(x = var_1290_cast_fp16, y = var_1291_to_fp16)[name = tensor<string, []>("aw_chunk_117_cast_fp16")];
            tensor<string, []> var_1294_equation_0 = const()[name = tensor<string, []>("op_1294_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1294_cast_fp16 = einsum(equation = var_1294_equation_0, values = (var_1148_cast_fp16, var_1091_cast_fp16))[name = tensor<string, []>("op_1294_cast_fp16")];
            tensor<fp16, []> var_1295_to_fp16 = const()[name = tensor<string, []>("op_1295_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_119_cast_fp16 = mul(x = var_1294_cast_fp16, y = var_1295_to_fp16)[name = tensor<string, []>("aw_chunk_119_cast_fp16")];
            tensor<string, []> var_1298_equation_0 = const()[name = tensor<string, []>("op_1298_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1298_cast_fp16 = einsum(equation = var_1298_equation_0, values = (var_1152_cast_fp16, var_1098_cast_fp16))[name = tensor<string, []>("op_1298_cast_fp16")];
            tensor<fp16, []> var_1299_to_fp16 = const()[name = tensor<string, []>("op_1299_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_121_cast_fp16 = mul(x = var_1298_cast_fp16, y = var_1299_to_fp16)[name = tensor<string, []>("aw_chunk_121_cast_fp16")];
            tensor<string, []> var_1302_equation_0 = const()[name = tensor<string, []>("op_1302_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1302_cast_fp16 = einsum(equation = var_1302_equation_0, values = (var_1152_cast_fp16, var_1105_cast_fp16))[name = tensor<string, []>("op_1302_cast_fp16")];
            tensor<fp16, []> var_1303_to_fp16 = const()[name = tensor<string, []>("op_1303_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_123_cast_fp16 = mul(x = var_1302_cast_fp16, y = var_1303_to_fp16)[name = tensor<string, []>("aw_chunk_123_cast_fp16")];
            tensor<string, []> var_1306_equation_0 = const()[name = tensor<string, []>("op_1306_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1306_cast_fp16 = einsum(equation = var_1306_equation_0, values = (var_1152_cast_fp16, var_1112_cast_fp16))[name = tensor<string, []>("op_1306_cast_fp16")];
            tensor<fp16, []> var_1307_to_fp16 = const()[name = tensor<string, []>("op_1307_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_125_cast_fp16 = mul(x = var_1306_cast_fp16, y = var_1307_to_fp16)[name = tensor<string, []>("aw_chunk_125_cast_fp16")];
            tensor<string, []> var_1310_equation_0 = const()[name = tensor<string, []>("op_1310_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1310_cast_fp16 = einsum(equation = var_1310_equation_0, values = (var_1152_cast_fp16, var_1119_cast_fp16))[name = tensor<string, []>("op_1310_cast_fp16")];
            tensor<fp16, []> var_1311_to_fp16 = const()[name = tensor<string, []>("op_1311_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_127_cast_fp16 = mul(x = var_1310_cast_fp16, y = var_1311_to_fp16)[name = tensor<string, []>("aw_chunk_127_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1313_cast_fp16 = softmax(axis = var_810, x = aw_chunk_65_cast_fp16)[name = tensor<string, []>("op_1313_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1314_cast_fp16 = softmax(axis = var_810, x = aw_chunk_67_cast_fp16)[name = tensor<string, []>("op_1314_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1315_cast_fp16 = softmax(axis = var_810, x = aw_chunk_69_cast_fp16)[name = tensor<string, []>("op_1315_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1316_cast_fp16 = softmax(axis = var_810, x = aw_chunk_71_cast_fp16)[name = tensor<string, []>("op_1316_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1317_cast_fp16 = softmax(axis = var_810, x = aw_chunk_73_cast_fp16)[name = tensor<string, []>("op_1317_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1318_cast_fp16 = softmax(axis = var_810, x = aw_chunk_75_cast_fp16)[name = tensor<string, []>("op_1318_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1319_cast_fp16 = softmax(axis = var_810, x = aw_chunk_77_cast_fp16)[name = tensor<string, []>("op_1319_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1320_cast_fp16 = softmax(axis = var_810, x = aw_chunk_79_cast_fp16)[name = tensor<string, []>("op_1320_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1321_cast_fp16 = softmax(axis = var_810, x = aw_chunk_81_cast_fp16)[name = tensor<string, []>("op_1321_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1322_cast_fp16 = softmax(axis = var_810, x = aw_chunk_83_cast_fp16)[name = tensor<string, []>("op_1322_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1323_cast_fp16 = softmax(axis = var_810, x = aw_chunk_85_cast_fp16)[name = tensor<string, []>("op_1323_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1324_cast_fp16 = softmax(axis = var_810, x = aw_chunk_87_cast_fp16)[name = tensor<string, []>("op_1324_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1325_cast_fp16 = softmax(axis = var_810, x = aw_chunk_89_cast_fp16)[name = tensor<string, []>("op_1325_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1326_cast_fp16 = softmax(axis = var_810, x = aw_chunk_91_cast_fp16)[name = tensor<string, []>("op_1326_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1327_cast_fp16 = softmax(axis = var_810, x = aw_chunk_93_cast_fp16)[name = tensor<string, []>("op_1327_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1328_cast_fp16 = softmax(axis = var_810, x = aw_chunk_95_cast_fp16)[name = tensor<string, []>("op_1328_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1329_cast_fp16 = softmax(axis = var_810, x = aw_chunk_97_cast_fp16)[name = tensor<string, []>("op_1329_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1330_cast_fp16 = softmax(axis = var_810, x = aw_chunk_99_cast_fp16)[name = tensor<string, []>("op_1330_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1331_cast_fp16 = softmax(axis = var_810, x = aw_chunk_101_cast_fp16)[name = tensor<string, []>("op_1331_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1332_cast_fp16 = softmax(axis = var_810, x = aw_chunk_103_cast_fp16)[name = tensor<string, []>("op_1332_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1333_cast_fp16 = softmax(axis = var_810, x = aw_chunk_105_cast_fp16)[name = tensor<string, []>("op_1333_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1334_cast_fp16 = softmax(axis = var_810, x = aw_chunk_107_cast_fp16)[name = tensor<string, []>("op_1334_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1335_cast_fp16 = softmax(axis = var_810, x = aw_chunk_109_cast_fp16)[name = tensor<string, []>("op_1335_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1336_cast_fp16 = softmax(axis = var_810, x = aw_chunk_111_cast_fp16)[name = tensor<string, []>("op_1336_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1337_cast_fp16 = softmax(axis = var_810, x = aw_chunk_113_cast_fp16)[name = tensor<string, []>("op_1337_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1338_cast_fp16 = softmax(axis = var_810, x = aw_chunk_115_cast_fp16)[name = tensor<string, []>("op_1338_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1339_cast_fp16 = softmax(axis = var_810, x = aw_chunk_117_cast_fp16)[name = tensor<string, []>("op_1339_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1340_cast_fp16 = softmax(axis = var_810, x = aw_chunk_119_cast_fp16)[name = tensor<string, []>("op_1340_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1341_cast_fp16 = softmax(axis = var_810, x = aw_chunk_121_cast_fp16)[name = tensor<string, []>("op_1341_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1342_cast_fp16 = softmax(axis = var_810, x = aw_chunk_123_cast_fp16)[name = tensor<string, []>("op_1342_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1343_cast_fp16 = softmax(axis = var_810, x = aw_chunk_125_cast_fp16)[name = tensor<string, []>("op_1343_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1344_cast_fp16 = softmax(axis = var_810, x = aw_chunk_127_cast_fp16)[name = tensor<string, []>("op_1344_cast_fp16")];
            tensor<string, []> var_1346_equation_0 = const()[name = tensor<string, []>("op_1346_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1346_cast_fp16 = einsum(equation = var_1346_equation_0, values = (var_1154_cast_fp16, var_1313_cast_fp16))[name = tensor<string, []>("op_1346_cast_fp16")];
            tensor<string, []> var_1348_equation_0 = const()[name = tensor<string, []>("op_1348_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1348_cast_fp16 = einsum(equation = var_1348_equation_0, values = (var_1154_cast_fp16, var_1314_cast_fp16))[name = tensor<string, []>("op_1348_cast_fp16")];
            tensor<string, []> var_1350_equation_0 = const()[name = tensor<string, []>("op_1350_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1350_cast_fp16 = einsum(equation = var_1350_equation_0, values = (var_1154_cast_fp16, var_1315_cast_fp16))[name = tensor<string, []>("op_1350_cast_fp16")];
            tensor<string, []> var_1352_equation_0 = const()[name = tensor<string, []>("op_1352_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1352_cast_fp16 = einsum(equation = var_1352_equation_0, values = (var_1154_cast_fp16, var_1316_cast_fp16))[name = tensor<string, []>("op_1352_cast_fp16")];
            tensor<string, []> var_1354_equation_0 = const()[name = tensor<string, []>("op_1354_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1354_cast_fp16 = einsum(equation = var_1354_equation_0, values = (var_1158_cast_fp16, var_1317_cast_fp16))[name = tensor<string, []>("op_1354_cast_fp16")];
            tensor<string, []> var_1356_equation_0 = const()[name = tensor<string, []>("op_1356_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1356_cast_fp16 = einsum(equation = var_1356_equation_0, values = (var_1158_cast_fp16, var_1318_cast_fp16))[name = tensor<string, []>("op_1356_cast_fp16")];
            tensor<string, []> var_1358_equation_0 = const()[name = tensor<string, []>("op_1358_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1358_cast_fp16 = einsum(equation = var_1358_equation_0, values = (var_1158_cast_fp16, var_1319_cast_fp16))[name = tensor<string, []>("op_1358_cast_fp16")];
            tensor<string, []> var_1360_equation_0 = const()[name = tensor<string, []>("op_1360_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1360_cast_fp16 = einsum(equation = var_1360_equation_0, values = (var_1158_cast_fp16, var_1320_cast_fp16))[name = tensor<string, []>("op_1360_cast_fp16")];
            tensor<string, []> var_1362_equation_0 = const()[name = tensor<string, []>("op_1362_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1362_cast_fp16 = einsum(equation = var_1362_equation_0, values = (var_1162_cast_fp16, var_1321_cast_fp16))[name = tensor<string, []>("op_1362_cast_fp16")];
            tensor<string, []> var_1364_equation_0 = const()[name = tensor<string, []>("op_1364_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1364_cast_fp16 = einsum(equation = var_1364_equation_0, values = (var_1162_cast_fp16, var_1322_cast_fp16))[name = tensor<string, []>("op_1364_cast_fp16")];
            tensor<string, []> var_1366_equation_0 = const()[name = tensor<string, []>("op_1366_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1366_cast_fp16 = einsum(equation = var_1366_equation_0, values = (var_1162_cast_fp16, var_1323_cast_fp16))[name = tensor<string, []>("op_1366_cast_fp16")];
            tensor<string, []> var_1368_equation_0 = const()[name = tensor<string, []>("op_1368_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1368_cast_fp16 = einsum(equation = var_1368_equation_0, values = (var_1162_cast_fp16, var_1324_cast_fp16))[name = tensor<string, []>("op_1368_cast_fp16")];
            tensor<string, []> var_1370_equation_0 = const()[name = tensor<string, []>("op_1370_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1370_cast_fp16 = einsum(equation = var_1370_equation_0, values = (var_1166_cast_fp16, var_1325_cast_fp16))[name = tensor<string, []>("op_1370_cast_fp16")];
            tensor<string, []> var_1372_equation_0 = const()[name = tensor<string, []>("op_1372_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1372_cast_fp16 = einsum(equation = var_1372_equation_0, values = (var_1166_cast_fp16, var_1326_cast_fp16))[name = tensor<string, []>("op_1372_cast_fp16")];
            tensor<string, []> var_1374_equation_0 = const()[name = tensor<string, []>("op_1374_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1374_cast_fp16 = einsum(equation = var_1374_equation_0, values = (var_1166_cast_fp16, var_1327_cast_fp16))[name = tensor<string, []>("op_1374_cast_fp16")];
            tensor<string, []> var_1376_equation_0 = const()[name = tensor<string, []>("op_1376_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1376_cast_fp16 = einsum(equation = var_1376_equation_0, values = (var_1166_cast_fp16, var_1328_cast_fp16))[name = tensor<string, []>("op_1376_cast_fp16")];
            tensor<string, []> var_1378_equation_0 = const()[name = tensor<string, []>("op_1378_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1378_cast_fp16 = einsum(equation = var_1378_equation_0, values = (var_1170_cast_fp16, var_1329_cast_fp16))[name = tensor<string, []>("op_1378_cast_fp16")];
            tensor<string, []> var_1380_equation_0 = const()[name = tensor<string, []>("op_1380_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1380_cast_fp16 = einsum(equation = var_1380_equation_0, values = (var_1170_cast_fp16, var_1330_cast_fp16))[name = tensor<string, []>("op_1380_cast_fp16")];
            tensor<string, []> var_1382_equation_0 = const()[name = tensor<string, []>("op_1382_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1382_cast_fp16 = einsum(equation = var_1382_equation_0, values = (var_1170_cast_fp16, var_1331_cast_fp16))[name = tensor<string, []>("op_1382_cast_fp16")];
            tensor<string, []> var_1384_equation_0 = const()[name = tensor<string, []>("op_1384_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1384_cast_fp16 = einsum(equation = var_1384_equation_0, values = (var_1170_cast_fp16, var_1332_cast_fp16))[name = tensor<string, []>("op_1384_cast_fp16")];
            tensor<string, []> var_1386_equation_0 = const()[name = tensor<string, []>("op_1386_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1386_cast_fp16 = einsum(equation = var_1386_equation_0, values = (var_1174_cast_fp16, var_1333_cast_fp16))[name = tensor<string, []>("op_1386_cast_fp16")];
            tensor<string, []> var_1388_equation_0 = const()[name = tensor<string, []>("op_1388_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1388_cast_fp16 = einsum(equation = var_1388_equation_0, values = (var_1174_cast_fp16, var_1334_cast_fp16))[name = tensor<string, []>("op_1388_cast_fp16")];
            tensor<string, []> var_1390_equation_0 = const()[name = tensor<string, []>("op_1390_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1390_cast_fp16 = einsum(equation = var_1390_equation_0, values = (var_1174_cast_fp16, var_1335_cast_fp16))[name = tensor<string, []>("op_1390_cast_fp16")];
            tensor<string, []> var_1392_equation_0 = const()[name = tensor<string, []>("op_1392_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1392_cast_fp16 = einsum(equation = var_1392_equation_0, values = (var_1174_cast_fp16, var_1336_cast_fp16))[name = tensor<string, []>("op_1392_cast_fp16")];
            tensor<string, []> var_1394_equation_0 = const()[name = tensor<string, []>("op_1394_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1394_cast_fp16 = einsum(equation = var_1394_equation_0, values = (var_1178_cast_fp16, var_1337_cast_fp16))[name = tensor<string, []>("op_1394_cast_fp16")];
            tensor<string, []> var_1396_equation_0 = const()[name = tensor<string, []>("op_1396_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1396_cast_fp16 = einsum(equation = var_1396_equation_0, values = (var_1178_cast_fp16, var_1338_cast_fp16))[name = tensor<string, []>("op_1396_cast_fp16")];
            tensor<string, []> var_1398_equation_0 = const()[name = tensor<string, []>("op_1398_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1398_cast_fp16 = einsum(equation = var_1398_equation_0, values = (var_1178_cast_fp16, var_1339_cast_fp16))[name = tensor<string, []>("op_1398_cast_fp16")];
            tensor<string, []> var_1400_equation_0 = const()[name = tensor<string, []>("op_1400_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1400_cast_fp16 = einsum(equation = var_1400_equation_0, values = (var_1178_cast_fp16, var_1340_cast_fp16))[name = tensor<string, []>("op_1400_cast_fp16")];
            tensor<string, []> var_1402_equation_0 = const()[name = tensor<string, []>("op_1402_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1402_cast_fp16 = einsum(equation = var_1402_equation_0, values = (var_1182_cast_fp16, var_1341_cast_fp16))[name = tensor<string, []>("op_1402_cast_fp16")];
            tensor<string, []> var_1404_equation_0 = const()[name = tensor<string, []>("op_1404_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1404_cast_fp16 = einsum(equation = var_1404_equation_0, values = (var_1182_cast_fp16, var_1342_cast_fp16))[name = tensor<string, []>("op_1404_cast_fp16")];
            tensor<string, []> var_1406_equation_0 = const()[name = tensor<string, []>("op_1406_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1406_cast_fp16 = einsum(equation = var_1406_equation_0, values = (var_1182_cast_fp16, var_1343_cast_fp16))[name = tensor<string, []>("op_1406_cast_fp16")];
            tensor<string, []> var_1408_equation_0 = const()[name = tensor<string, []>("op_1408_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_1408_cast_fp16 = einsum(equation = var_1408_equation_0, values = (var_1182_cast_fp16, var_1344_cast_fp16))[name = tensor<string, []>("op_1408_cast_fp16")];
            tensor<bool, []> var_1410_interleave_0 = const()[name = tensor<string, []>("op_1410_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_1410_cast_fp16 = concat(axis = var_797, interleave = var_1410_interleave_0, values = (var_1346_cast_fp16, var_1348_cast_fp16, var_1350_cast_fp16, var_1352_cast_fp16))[name = tensor<string, []>("op_1410_cast_fp16")];
            tensor<bool, []> var_1412_interleave_0 = const()[name = tensor<string, []>("op_1412_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_1412_cast_fp16 = concat(axis = var_797, interleave = var_1412_interleave_0, values = (var_1354_cast_fp16, var_1356_cast_fp16, var_1358_cast_fp16, var_1360_cast_fp16))[name = tensor<string, []>("op_1412_cast_fp16")];
            tensor<bool, []> var_1414_interleave_0 = const()[name = tensor<string, []>("op_1414_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_1414_cast_fp16 = concat(axis = var_797, interleave = var_1414_interleave_0, values = (var_1362_cast_fp16, var_1364_cast_fp16, var_1366_cast_fp16, var_1368_cast_fp16))[name = tensor<string, []>("op_1414_cast_fp16")];
            tensor<bool, []> var_1416_interleave_0 = const()[name = tensor<string, []>("op_1416_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_1416_cast_fp16 = concat(axis = var_797, interleave = var_1416_interleave_0, values = (var_1370_cast_fp16, var_1372_cast_fp16, var_1374_cast_fp16, var_1376_cast_fp16))[name = tensor<string, []>("op_1416_cast_fp16")];
            tensor<bool, []> var_1418_interleave_0 = const()[name = tensor<string, []>("op_1418_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_1418_cast_fp16 = concat(axis = var_797, interleave = var_1418_interleave_0, values = (var_1378_cast_fp16, var_1380_cast_fp16, var_1382_cast_fp16, var_1384_cast_fp16))[name = tensor<string, []>("op_1418_cast_fp16")];
            tensor<bool, []> var_1420_interleave_0 = const()[name = tensor<string, []>("op_1420_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_1420_cast_fp16 = concat(axis = var_797, interleave = var_1420_interleave_0, values = (var_1386_cast_fp16, var_1388_cast_fp16, var_1390_cast_fp16, var_1392_cast_fp16))[name = tensor<string, []>("op_1420_cast_fp16")];
            tensor<bool, []> var_1422_interleave_0 = const()[name = tensor<string, []>("op_1422_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_1422_cast_fp16 = concat(axis = var_797, interleave = var_1422_interleave_0, values = (var_1394_cast_fp16, var_1396_cast_fp16, var_1398_cast_fp16, var_1400_cast_fp16))[name = tensor<string, []>("op_1422_cast_fp16")];
            tensor<bool, []> var_1424_interleave_0 = const()[name = tensor<string, []>("op_1424_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_1424_cast_fp16 = concat(axis = var_797, interleave = var_1424_interleave_0, values = (var_1402_cast_fp16, var_1404_cast_fp16, var_1406_cast_fp16, var_1408_cast_fp16))[name = tensor<string, []>("op_1424_cast_fp16")];
            tensor<bool, []> input_9_interleave_0 = const()[name = tensor<string, []>("input_9_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 512, 1, 1500]> input_9_cast_fp16 = concat(axis = var_810, interleave = input_9_interleave_0, values = (var_1410_cast_fp16, var_1412_cast_fp16, var_1414_cast_fp16, var_1416_cast_fp16, var_1418_cast_fp16, var_1420_cast_fp16, var_1422_cast_fp16, var_1424_cast_fp16))[name = tensor<string, []>("input_9_cast_fp16")];
            tensor<int32, [2]> var_1429 = const()[name = tensor<string, []>("op_1429"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1431 = const()[name = tensor<string, []>("op_1431"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_7_pad_type_0 = const()[name = tensor<string, []>("obj_7_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_7_pad_0 = const()[name = tensor<string, []>("obj_7_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_1_self_attn_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_o_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11241344)))];
            tensor<fp16, [512]> layers_1_self_attn_o_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_self_attn_o_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11765696)))];
            tensor<fp16, [1, 512, 1, 1500]> obj_7_cast_fp16 = conv(bias = layers_1_self_attn_o_proj_bias_to_fp16, dilations = var_1431, groups = var_810, pad = obj_7_pad_0, pad_type = obj_7_pad_type_0, strides = var_1429, weight = layers_1_self_attn_o_proj_weight_to_fp16, x = input_9_cast_fp16)[name = tensor<string, []>("obj_7_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_7_cast_fp16 = add(x = inputs_5_cast_fp16, y = obj_7_cast_fp16)[name = tensor<string, []>("inputs_7_cast_fp16")];
            tensor<int32, [1]> var_1437 = const()[name = tensor<string, []>("op_1437"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_7_cast_fp16 = reduce_mean(axes = var_1437, keep_dims = var_811, x = inputs_7_cast_fp16)[name = tensor<string, []>("channels_mean_7_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_7_cast_fp16 = sub(x = inputs_7_cast_fp16, y = channels_mean_7_cast_fp16)[name = tensor<string, []>("zero_mean_7_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_7_cast_fp16 = mul(x = zero_mean_7_cast_fp16, y = zero_mean_7_cast_fp16)[name = tensor<string, []>("zero_mean_sq_7_cast_fp16")];
            tensor<int32, [1]> var_1441 = const()[name = tensor<string, []>("op_1441"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_1442_cast_fp16 = reduce_mean(axes = var_1441, keep_dims = var_811, x = zero_mean_sq_7_cast_fp16)[name = tensor<string, []>("op_1442_cast_fp16")];
            tensor<fp16, []> var_1443_to_fp16 = const()[name = tensor<string, []>("op_1443_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_1444_cast_fp16 = add(x = var_1442_cast_fp16, y = var_1443_to_fp16)[name = tensor<string, []>("op_1444_cast_fp16")];
            tensor<fp16, []> denom_7_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_7_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_7_cast_fp16 = rsqrt(epsilon = denom_7_epsilon_0_to_fp16, x = var_1444_cast_fp16)[name = tensor<string, []>("denom_7_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_7_cast_fp16 = mul(x = zero_mean_7_cast_fp16, y = denom_7_cast_fp16)[name = tensor<string, []>("out_7_cast_fp16")];
            tensor<fp16, [512]> input_11_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_11_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11766784)))];
            tensor<fp16, [512]> input_11_beta_0_to_fp16 = const()[name = tensor<string, []>("input_11_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11767872)))];
            tensor<fp16, []> input_11_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_11_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> input_11_cast_fp16 = batch_norm(beta = input_11_beta_0_to_fp16, epsilon = input_11_epsilon_0_to_fp16, gamma = input_11_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_7_cast_fp16)[name = tensor<string, []>("input_11_cast_fp16")];
            tensor<int32, [2]> var_1455 = const()[name = tensor<string, []>("op_1455"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1457 = const()[name = tensor<string, []>("op_1457"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> input_13_pad_type_0 = const()[name = tensor<string, []>("input_13_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> input_13_pad_0 = const()[name = tensor<string, []>("input_13_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [2048, 512, 1, 1]> layers_1_fc1_weight_to_fp16 = const()[name = tensor<string, []>("layers_1_fc1_weight_to_fp16"), val = tensor<fp16, [2048, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(11768960)))];
            tensor<fp16, [2048]> layers_1_fc1_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_fc1_bias_to_fp16"), val = tensor<fp16, [2048]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13866176)))];
            tensor<fp16, [1, 2048, 1, 1500]> input_13_cast_fp16 = conv(bias = layers_1_fc1_bias_to_fp16, dilations = var_1457, groups = var_810, pad = input_13_pad_0, pad_type = input_13_pad_type_0, strides = var_1455, weight = layers_1_fc1_weight_to_fp16, x = input_11_cast_fp16)[name = tensor<string, []>("input_13_cast_fp16")];
            tensor<string, []> input_15_mode_0 = const()[name = tensor<string, []>("input_15_mode_0"), val = tensor<string, []>("EXACT")];
            tensor<fp16, [1, 2048, 1, 1500]> input_15_cast_fp16 = gelu(mode = input_15_mode_0, x = input_13_cast_fp16)[name = tensor<string, []>("input_15_cast_fp16")];
            tensor<int32, [2]> var_1463 = const()[name = tensor<string, []>("op_1463"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1465 = const()[name = tensor<string, []>("op_1465"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> hidden_states_7_pad_type_0 = const()[name = tensor<string, []>("hidden_states_7_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> hidden_states_7_pad_0 = const()[name = tensor<string, []>("hidden_states_7_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 2048, 1, 1]> layers_1_fc2_weight_to_fp16 = const()[name = tensor<string, []>("layers_1_fc2_weight_to_fp16"), val = tensor<fp16, [512, 2048, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(13870336)))];
            tensor<fp16, [512]> layers_1_fc2_bias_to_fp16 = const()[name = tensor<string, []>("layers_1_fc2_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(15967552)))];
            tensor<fp16, [1, 512, 1, 1500]> hidden_states_7_cast_fp16 = conv(bias = layers_1_fc2_bias_to_fp16, dilations = var_1465, groups = var_810, pad = hidden_states_7_pad_0, pad_type = hidden_states_7_pad_type_0, strides = var_1463, weight = layers_1_fc2_weight_to_fp16, x = input_15_cast_fp16)[name = tensor<string, []>("hidden_states_7_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_9_cast_fp16 = add(x = inputs_7_cast_fp16, y = hidden_states_7_cast_fp16)[name = tensor<string, []>("inputs_9_cast_fp16")];
            tensor<int32, []> var_1472 = const()[name = tensor<string, []>("op_1472"), val = tensor<int32, []>(3)];
            tensor<int32, []> var_1485 = const()[name = tensor<string, []>("op_1485"), val = tensor<int32, []>(1)];
            tensor<bool, []> var_1486 = const()[name = tensor<string, []>("op_1486"), val = tensor<bool, []>(true)];
            tensor<int32, [1]> var_1496 = const()[name = tensor<string, []>("op_1496"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_9_cast_fp16 = reduce_mean(axes = var_1496, keep_dims = var_1486, x = inputs_9_cast_fp16)[name = tensor<string, []>("channels_mean_9_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_9_cast_fp16 = sub(x = inputs_9_cast_fp16, y = channels_mean_9_cast_fp16)[name = tensor<string, []>("zero_mean_9_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_9_cast_fp16 = mul(x = zero_mean_9_cast_fp16, y = zero_mean_9_cast_fp16)[name = tensor<string, []>("zero_mean_sq_9_cast_fp16")];
            tensor<int32, [1]> var_1500 = const()[name = tensor<string, []>("op_1500"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_1501_cast_fp16 = reduce_mean(axes = var_1500, keep_dims = var_1486, x = zero_mean_sq_9_cast_fp16)[name = tensor<string, []>("op_1501_cast_fp16")];
            tensor<fp16, []> var_1502_to_fp16 = const()[name = tensor<string, []>("op_1502_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_1503_cast_fp16 = add(x = var_1501_cast_fp16, y = var_1502_to_fp16)[name = tensor<string, []>("op_1503_cast_fp16")];
            tensor<fp16, []> denom_9_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_9_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_9_cast_fp16 = rsqrt(epsilon = denom_9_epsilon_0_to_fp16, x = var_1503_cast_fp16)[name = tensor<string, []>("denom_9_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_9_cast_fp16 = mul(x = zero_mean_9_cast_fp16, y = denom_9_cast_fp16)[name = tensor<string, []>("out_9_cast_fp16")];
            tensor<fp16, [512]> obj_9_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_9_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(15968640)))];
            tensor<fp16, [512]> obj_9_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_9_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(15969728)))];
            tensor<fp16, []> obj_9_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_9_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> obj_9_cast_fp16 = batch_norm(beta = obj_9_beta_0_to_fp16, epsilon = obj_9_epsilon_0_to_fp16, gamma = obj_9_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_9_cast_fp16)[name = tensor<string, []>("obj_9_cast_fp16")];
            tensor<int32, [2]> var_1518 = const()[name = tensor<string, []>("op_1518"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1520 = const()[name = tensor<string, []>("op_1520"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_5_pad_type_0 = const()[name = tensor<string, []>("query_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_5_pad_0 = const()[name = tensor<string, []>("query_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_2_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(15970816)))];
            tensor<fp16, [512]> layers_2_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16495168)))];
            tensor<fp16, [1, 512, 1, 1500]> query_5_cast_fp16 = conv(bias = layers_2_self_attn_q_proj_bias_to_fp16, dilations = var_1520, groups = var_1485, pad = query_5_pad_0, pad_type = query_5_pad_type_0, strides = var_1518, weight = layers_2_self_attn_q_proj_weight_to_fp16, x = obj_9_cast_fp16)[name = tensor<string, []>("query_5_cast_fp16")];
            tensor<int32, [2]> var_1524 = const()[name = tensor<string, []>("op_1524"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1526 = const()[name = tensor<string, []>("op_1526"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_5_pad_type_0 = const()[name = tensor<string, []>("key_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_5_pad_0 = const()[name = tensor<string, []>("key_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_2_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(16496256)))];
            tensor<fp16, [1, 512, 1, 1500]> key_5_cast_fp16 = conv(dilations = var_1526, groups = var_1485, pad = key_5_pad_0, pad_type = key_5_pad_type_0, strides = var_1524, weight = layers_2_self_attn_k_proj_weight_to_fp16, x = obj_9_cast_fp16)[name = tensor<string, []>("key_5_cast_fp16")];
            tensor<int32, [2]> var_1531 = const()[name = tensor<string, []>("op_1531"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_1533 = const()[name = tensor<string, []>("op_1533"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_5_pad_type_0 = const()[name = tensor<string, []>("value_5_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_5_pad_0 = const()[name = tensor<string, []>("value_5_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_2_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17020608)))];
            tensor<fp16, [512]> layers_2_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17544960)))];
            tensor<fp16, [1, 512, 1, 1500]> value_5_cast_fp16 = conv(bias = layers_2_self_attn_v_proj_bias_to_fp16, dilations = var_1533, groups = var_1485, pad = value_5_pad_0, pad_type = value_5_pad_type_0, strides = var_1531, weight = layers_2_self_attn_v_proj_weight_to_fp16, x = obj_9_cast_fp16)[name = tensor<string, []>("value_5_cast_fp16")];
            tensor<int32, [4]> var_1540_begin_0 = const()[name = tensor<string, []>("op_1540_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1540_end_0 = const()[name = tensor<string, []>("op_1540_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1540_end_mask_0 = const()[name = tensor<string, []>("op_1540_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1540_cast_fp16 = slice_by_index(begin = var_1540_begin_0, end = var_1540_end_0, end_mask = var_1540_end_mask_0, x = query_5_cast_fp16)[name = tensor<string, []>("op_1540_cast_fp16")];
            tensor<int32, [4]> var_1544_begin_0 = const()[name = tensor<string, []>("op_1544_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_1544_end_0 = const()[name = tensor<string, []>("op_1544_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_1544_end_mask_0 = const()[name = tensor<string, []>("op_1544_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1544_cast_fp16 = slice_by_index(begin = var_1544_begin_0, end = var_1544_end_0, end_mask = var_1544_end_mask_0, x = query_5_cast_fp16)[name = tensor<string, []>("op_1544_cast_fp16")];
            tensor<int32, [4]> var_1548_begin_0 = const()[name = tensor<string, []>("op_1548_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_1548_end_0 = const()[name = tensor<string, []>("op_1548_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_1548_end_mask_0 = const()[name = tensor<string, []>("op_1548_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1548_cast_fp16 = slice_by_index(begin = var_1548_begin_0, end = var_1548_end_0, end_mask = var_1548_end_mask_0, x = query_5_cast_fp16)[name = tensor<string, []>("op_1548_cast_fp16")];
            tensor<int32, [4]> var_1552_begin_0 = const()[name = tensor<string, []>("op_1552_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_1552_end_0 = const()[name = tensor<string, []>("op_1552_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_1552_end_mask_0 = const()[name = tensor<string, []>("op_1552_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1552_cast_fp16 = slice_by_index(begin = var_1552_begin_0, end = var_1552_end_0, end_mask = var_1552_end_mask_0, x = query_5_cast_fp16)[name = tensor<string, []>("op_1552_cast_fp16")];
            tensor<int32, [4]> var_1556_begin_0 = const()[name = tensor<string, []>("op_1556_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_1556_end_0 = const()[name = tensor<string, []>("op_1556_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_1556_end_mask_0 = const()[name = tensor<string, []>("op_1556_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1556_cast_fp16 = slice_by_index(begin = var_1556_begin_0, end = var_1556_end_0, end_mask = var_1556_end_mask_0, x = query_5_cast_fp16)[name = tensor<string, []>("op_1556_cast_fp16")];
            tensor<int32, [4]> var_1560_begin_0 = const()[name = tensor<string, []>("op_1560_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_1560_end_0 = const()[name = tensor<string, []>("op_1560_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_1560_end_mask_0 = const()[name = tensor<string, []>("op_1560_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1560_cast_fp16 = slice_by_index(begin = var_1560_begin_0, end = var_1560_end_0, end_mask = var_1560_end_mask_0, x = query_5_cast_fp16)[name = tensor<string, []>("op_1560_cast_fp16")];
            tensor<int32, [4]> var_1564_begin_0 = const()[name = tensor<string, []>("op_1564_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_1564_end_0 = const()[name = tensor<string, []>("op_1564_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_1564_end_mask_0 = const()[name = tensor<string, []>("op_1564_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1564_cast_fp16 = slice_by_index(begin = var_1564_begin_0, end = var_1564_end_0, end_mask = var_1564_end_mask_0, x = query_5_cast_fp16)[name = tensor<string, []>("op_1564_cast_fp16")];
            tensor<int32, [4]> var_1568_begin_0 = const()[name = tensor<string, []>("op_1568_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_1568_end_0 = const()[name = tensor<string, []>("op_1568_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_1568_end_mask_0 = const()[name = tensor<string, []>("op_1568_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1568_cast_fp16 = slice_by_index(begin = var_1568_begin_0, end = var_1568_end_0, end_mask = var_1568_end_mask_0, x = query_5_cast_fp16)[name = tensor<string, []>("op_1568_cast_fp16")];
            tensor<int32, [4]> var_1577_begin_0 = const()[name = tensor<string, []>("op_1577_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1577_end_0 = const()[name = tensor<string, []>("op_1577_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1577_end_mask_0 = const()[name = tensor<string, []>("op_1577_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1577_cast_fp16 = slice_by_index(begin = var_1577_begin_0, end = var_1577_end_0, end_mask = var_1577_end_mask_0, x = var_1540_cast_fp16)[name = tensor<string, []>("op_1577_cast_fp16")];
            tensor<int32, [4]> var_1584_begin_0 = const()[name = tensor<string, []>("op_1584_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1584_end_0 = const()[name = tensor<string, []>("op_1584_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1584_end_mask_0 = const()[name = tensor<string, []>("op_1584_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1584_cast_fp16 = slice_by_index(begin = var_1584_begin_0, end = var_1584_end_0, end_mask = var_1584_end_mask_0, x = var_1540_cast_fp16)[name = tensor<string, []>("op_1584_cast_fp16")];
            tensor<int32, [4]> var_1591_begin_0 = const()[name = tensor<string, []>("op_1591_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1591_end_0 = const()[name = tensor<string, []>("op_1591_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1591_end_mask_0 = const()[name = tensor<string, []>("op_1591_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1591_cast_fp16 = slice_by_index(begin = var_1591_begin_0, end = var_1591_end_0, end_mask = var_1591_end_mask_0, x = var_1540_cast_fp16)[name = tensor<string, []>("op_1591_cast_fp16")];
            tensor<int32, [4]> var_1598_begin_0 = const()[name = tensor<string, []>("op_1598_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1598_end_0 = const()[name = tensor<string, []>("op_1598_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1598_end_mask_0 = const()[name = tensor<string, []>("op_1598_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1598_cast_fp16 = slice_by_index(begin = var_1598_begin_0, end = var_1598_end_0, end_mask = var_1598_end_mask_0, x = var_1540_cast_fp16)[name = tensor<string, []>("op_1598_cast_fp16")];
            tensor<int32, [4]> var_1605_begin_0 = const()[name = tensor<string, []>("op_1605_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1605_end_0 = const()[name = tensor<string, []>("op_1605_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1605_end_mask_0 = const()[name = tensor<string, []>("op_1605_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1605_cast_fp16 = slice_by_index(begin = var_1605_begin_0, end = var_1605_end_0, end_mask = var_1605_end_mask_0, x = var_1544_cast_fp16)[name = tensor<string, []>("op_1605_cast_fp16")];
            tensor<int32, [4]> var_1612_begin_0 = const()[name = tensor<string, []>("op_1612_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1612_end_0 = const()[name = tensor<string, []>("op_1612_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1612_end_mask_0 = const()[name = tensor<string, []>("op_1612_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1612_cast_fp16 = slice_by_index(begin = var_1612_begin_0, end = var_1612_end_0, end_mask = var_1612_end_mask_0, x = var_1544_cast_fp16)[name = tensor<string, []>("op_1612_cast_fp16")];
            tensor<int32, [4]> var_1619_begin_0 = const()[name = tensor<string, []>("op_1619_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1619_end_0 = const()[name = tensor<string, []>("op_1619_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1619_end_mask_0 = const()[name = tensor<string, []>("op_1619_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1619_cast_fp16 = slice_by_index(begin = var_1619_begin_0, end = var_1619_end_0, end_mask = var_1619_end_mask_0, x = var_1544_cast_fp16)[name = tensor<string, []>("op_1619_cast_fp16")];
            tensor<int32, [4]> var_1626_begin_0 = const()[name = tensor<string, []>("op_1626_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1626_end_0 = const()[name = tensor<string, []>("op_1626_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1626_end_mask_0 = const()[name = tensor<string, []>("op_1626_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1626_cast_fp16 = slice_by_index(begin = var_1626_begin_0, end = var_1626_end_0, end_mask = var_1626_end_mask_0, x = var_1544_cast_fp16)[name = tensor<string, []>("op_1626_cast_fp16")];
            tensor<int32, [4]> var_1633_begin_0 = const()[name = tensor<string, []>("op_1633_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1633_end_0 = const()[name = tensor<string, []>("op_1633_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1633_end_mask_0 = const()[name = tensor<string, []>("op_1633_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1633_cast_fp16 = slice_by_index(begin = var_1633_begin_0, end = var_1633_end_0, end_mask = var_1633_end_mask_0, x = var_1548_cast_fp16)[name = tensor<string, []>("op_1633_cast_fp16")];
            tensor<int32, [4]> var_1640_begin_0 = const()[name = tensor<string, []>("op_1640_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1640_end_0 = const()[name = tensor<string, []>("op_1640_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1640_end_mask_0 = const()[name = tensor<string, []>("op_1640_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1640_cast_fp16 = slice_by_index(begin = var_1640_begin_0, end = var_1640_end_0, end_mask = var_1640_end_mask_0, x = var_1548_cast_fp16)[name = tensor<string, []>("op_1640_cast_fp16")];
            tensor<int32, [4]> var_1647_begin_0 = const()[name = tensor<string, []>("op_1647_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1647_end_0 = const()[name = tensor<string, []>("op_1647_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1647_end_mask_0 = const()[name = tensor<string, []>("op_1647_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1647_cast_fp16 = slice_by_index(begin = var_1647_begin_0, end = var_1647_end_0, end_mask = var_1647_end_mask_0, x = var_1548_cast_fp16)[name = tensor<string, []>("op_1647_cast_fp16")];
            tensor<int32, [4]> var_1654_begin_0 = const()[name = tensor<string, []>("op_1654_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1654_end_0 = const()[name = tensor<string, []>("op_1654_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1654_end_mask_0 = const()[name = tensor<string, []>("op_1654_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1654_cast_fp16 = slice_by_index(begin = var_1654_begin_0, end = var_1654_end_0, end_mask = var_1654_end_mask_0, x = var_1548_cast_fp16)[name = tensor<string, []>("op_1654_cast_fp16")];
            tensor<int32, [4]> var_1661_begin_0 = const()[name = tensor<string, []>("op_1661_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1661_end_0 = const()[name = tensor<string, []>("op_1661_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1661_end_mask_0 = const()[name = tensor<string, []>("op_1661_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1661_cast_fp16 = slice_by_index(begin = var_1661_begin_0, end = var_1661_end_0, end_mask = var_1661_end_mask_0, x = var_1552_cast_fp16)[name = tensor<string, []>("op_1661_cast_fp16")];
            tensor<int32, [4]> var_1668_begin_0 = const()[name = tensor<string, []>("op_1668_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1668_end_0 = const()[name = tensor<string, []>("op_1668_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1668_end_mask_0 = const()[name = tensor<string, []>("op_1668_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1668_cast_fp16 = slice_by_index(begin = var_1668_begin_0, end = var_1668_end_0, end_mask = var_1668_end_mask_0, x = var_1552_cast_fp16)[name = tensor<string, []>("op_1668_cast_fp16")];
            tensor<int32, [4]> var_1675_begin_0 = const()[name = tensor<string, []>("op_1675_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1675_end_0 = const()[name = tensor<string, []>("op_1675_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1675_end_mask_0 = const()[name = tensor<string, []>("op_1675_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1675_cast_fp16 = slice_by_index(begin = var_1675_begin_0, end = var_1675_end_0, end_mask = var_1675_end_mask_0, x = var_1552_cast_fp16)[name = tensor<string, []>("op_1675_cast_fp16")];
            tensor<int32, [4]> var_1682_begin_0 = const()[name = tensor<string, []>("op_1682_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1682_end_0 = const()[name = tensor<string, []>("op_1682_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1682_end_mask_0 = const()[name = tensor<string, []>("op_1682_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1682_cast_fp16 = slice_by_index(begin = var_1682_begin_0, end = var_1682_end_0, end_mask = var_1682_end_mask_0, x = var_1552_cast_fp16)[name = tensor<string, []>("op_1682_cast_fp16")];
            tensor<int32, [4]> var_1689_begin_0 = const()[name = tensor<string, []>("op_1689_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1689_end_0 = const()[name = tensor<string, []>("op_1689_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1689_end_mask_0 = const()[name = tensor<string, []>("op_1689_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1689_cast_fp16 = slice_by_index(begin = var_1689_begin_0, end = var_1689_end_0, end_mask = var_1689_end_mask_0, x = var_1556_cast_fp16)[name = tensor<string, []>("op_1689_cast_fp16")];
            tensor<int32, [4]> var_1696_begin_0 = const()[name = tensor<string, []>("op_1696_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1696_end_0 = const()[name = tensor<string, []>("op_1696_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1696_end_mask_0 = const()[name = tensor<string, []>("op_1696_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1696_cast_fp16 = slice_by_index(begin = var_1696_begin_0, end = var_1696_end_0, end_mask = var_1696_end_mask_0, x = var_1556_cast_fp16)[name = tensor<string, []>("op_1696_cast_fp16")];
            tensor<int32, [4]> var_1703_begin_0 = const()[name = tensor<string, []>("op_1703_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1703_end_0 = const()[name = tensor<string, []>("op_1703_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1703_end_mask_0 = const()[name = tensor<string, []>("op_1703_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1703_cast_fp16 = slice_by_index(begin = var_1703_begin_0, end = var_1703_end_0, end_mask = var_1703_end_mask_0, x = var_1556_cast_fp16)[name = tensor<string, []>("op_1703_cast_fp16")];
            tensor<int32, [4]> var_1710_begin_0 = const()[name = tensor<string, []>("op_1710_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1710_end_0 = const()[name = tensor<string, []>("op_1710_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1710_end_mask_0 = const()[name = tensor<string, []>("op_1710_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1710_cast_fp16 = slice_by_index(begin = var_1710_begin_0, end = var_1710_end_0, end_mask = var_1710_end_mask_0, x = var_1556_cast_fp16)[name = tensor<string, []>("op_1710_cast_fp16")];
            tensor<int32, [4]> var_1717_begin_0 = const()[name = tensor<string, []>("op_1717_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1717_end_0 = const()[name = tensor<string, []>("op_1717_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1717_end_mask_0 = const()[name = tensor<string, []>("op_1717_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1717_cast_fp16 = slice_by_index(begin = var_1717_begin_0, end = var_1717_end_0, end_mask = var_1717_end_mask_0, x = var_1560_cast_fp16)[name = tensor<string, []>("op_1717_cast_fp16")];
            tensor<int32, [4]> var_1724_begin_0 = const()[name = tensor<string, []>("op_1724_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1724_end_0 = const()[name = tensor<string, []>("op_1724_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1724_end_mask_0 = const()[name = tensor<string, []>("op_1724_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1724_cast_fp16 = slice_by_index(begin = var_1724_begin_0, end = var_1724_end_0, end_mask = var_1724_end_mask_0, x = var_1560_cast_fp16)[name = tensor<string, []>("op_1724_cast_fp16")];
            tensor<int32, [4]> var_1731_begin_0 = const()[name = tensor<string, []>("op_1731_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1731_end_0 = const()[name = tensor<string, []>("op_1731_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1731_end_mask_0 = const()[name = tensor<string, []>("op_1731_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1731_cast_fp16 = slice_by_index(begin = var_1731_begin_0, end = var_1731_end_0, end_mask = var_1731_end_mask_0, x = var_1560_cast_fp16)[name = tensor<string, []>("op_1731_cast_fp16")];
            tensor<int32, [4]> var_1738_begin_0 = const()[name = tensor<string, []>("op_1738_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1738_end_0 = const()[name = tensor<string, []>("op_1738_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1738_end_mask_0 = const()[name = tensor<string, []>("op_1738_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1738_cast_fp16 = slice_by_index(begin = var_1738_begin_0, end = var_1738_end_0, end_mask = var_1738_end_mask_0, x = var_1560_cast_fp16)[name = tensor<string, []>("op_1738_cast_fp16")];
            tensor<int32, [4]> var_1745_begin_0 = const()[name = tensor<string, []>("op_1745_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1745_end_0 = const()[name = tensor<string, []>("op_1745_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1745_end_mask_0 = const()[name = tensor<string, []>("op_1745_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1745_cast_fp16 = slice_by_index(begin = var_1745_begin_0, end = var_1745_end_0, end_mask = var_1745_end_mask_0, x = var_1564_cast_fp16)[name = tensor<string, []>("op_1745_cast_fp16")];
            tensor<int32, [4]> var_1752_begin_0 = const()[name = tensor<string, []>("op_1752_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1752_end_0 = const()[name = tensor<string, []>("op_1752_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1752_end_mask_0 = const()[name = tensor<string, []>("op_1752_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1752_cast_fp16 = slice_by_index(begin = var_1752_begin_0, end = var_1752_end_0, end_mask = var_1752_end_mask_0, x = var_1564_cast_fp16)[name = tensor<string, []>("op_1752_cast_fp16")];
            tensor<int32, [4]> var_1759_begin_0 = const()[name = tensor<string, []>("op_1759_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1759_end_0 = const()[name = tensor<string, []>("op_1759_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1759_end_mask_0 = const()[name = tensor<string, []>("op_1759_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1759_cast_fp16 = slice_by_index(begin = var_1759_begin_0, end = var_1759_end_0, end_mask = var_1759_end_mask_0, x = var_1564_cast_fp16)[name = tensor<string, []>("op_1759_cast_fp16")];
            tensor<int32, [4]> var_1766_begin_0 = const()[name = tensor<string, []>("op_1766_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1766_end_0 = const()[name = tensor<string, []>("op_1766_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1766_end_mask_0 = const()[name = tensor<string, []>("op_1766_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1766_cast_fp16 = slice_by_index(begin = var_1766_begin_0, end = var_1766_end_0, end_mask = var_1766_end_mask_0, x = var_1564_cast_fp16)[name = tensor<string, []>("op_1766_cast_fp16")];
            tensor<int32, [4]> var_1773_begin_0 = const()[name = tensor<string, []>("op_1773_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1773_end_0 = const()[name = tensor<string, []>("op_1773_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_1773_end_mask_0 = const()[name = tensor<string, []>("op_1773_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1773_cast_fp16 = slice_by_index(begin = var_1773_begin_0, end = var_1773_end_0, end_mask = var_1773_end_mask_0, x = var_1568_cast_fp16)[name = tensor<string, []>("op_1773_cast_fp16")];
            tensor<int32, [4]> var_1780_begin_0 = const()[name = tensor<string, []>("op_1780_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_1780_end_0 = const()[name = tensor<string, []>("op_1780_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_1780_end_mask_0 = const()[name = tensor<string, []>("op_1780_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1780_cast_fp16 = slice_by_index(begin = var_1780_begin_0, end = var_1780_end_0, end_mask = var_1780_end_mask_0, x = var_1568_cast_fp16)[name = tensor<string, []>("op_1780_cast_fp16")];
            tensor<int32, [4]> var_1787_begin_0 = const()[name = tensor<string, []>("op_1787_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_1787_end_0 = const()[name = tensor<string, []>("op_1787_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_1787_end_mask_0 = const()[name = tensor<string, []>("op_1787_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1787_cast_fp16 = slice_by_index(begin = var_1787_begin_0, end = var_1787_end_0, end_mask = var_1787_end_mask_0, x = var_1568_cast_fp16)[name = tensor<string, []>("op_1787_cast_fp16")];
            tensor<int32, [4]> var_1794_begin_0 = const()[name = tensor<string, []>("op_1794_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_1794_end_0 = const()[name = tensor<string, []>("op_1794_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1794_end_mask_0 = const()[name = tensor<string, []>("op_1794_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_1794_cast_fp16 = slice_by_index(begin = var_1794_begin_0, end = var_1794_end_0, end_mask = var_1794_end_mask_0, x = var_1568_cast_fp16)[name = tensor<string, []>("op_1794_cast_fp16")];
            tensor<int32, [4]> k_5_perm_0 = const()[name = tensor<string, []>("k_5_perm_0"), val = tensor<int32, [4]>([0, 3, 2, 1])];
            tensor<int32, [4]> var_1799_begin_0 = const()[name = tensor<string, []>("op_1799_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1799_end_0 = const()[name = tensor<string, []>("op_1799_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 64])];
            tensor<bool, [4]> var_1799_end_mask_0 = const()[name = tensor<string, []>("op_1799_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 512]> transpose_3 = transpose(perm = k_5_perm_0, x = key_5_cast_fp16)[name = tensor<string, []>("transpose_3")];
            tensor<fp16, [1, 1500, 1, 64]> var_1799_cast_fp16 = slice_by_index(begin = var_1799_begin_0, end = var_1799_end_0, end_mask = var_1799_end_mask_0, x = transpose_3)[name = tensor<string, []>("op_1799_cast_fp16")];
            tensor<int32, [4]> var_1803_begin_0 = const()[name = tensor<string, []>("op_1803_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 64])];
            tensor<int32, [4]> var_1803_end_0 = const()[name = tensor<string, []>("op_1803_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 128])];
            tensor<bool, [4]> var_1803_end_mask_0 = const()[name = tensor<string, []>("op_1803_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1803_cast_fp16 = slice_by_index(begin = var_1803_begin_0, end = var_1803_end_0, end_mask = var_1803_end_mask_0, x = transpose_3)[name = tensor<string, []>("op_1803_cast_fp16")];
            tensor<int32, [4]> var_1807_begin_0 = const()[name = tensor<string, []>("op_1807_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 128])];
            tensor<int32, [4]> var_1807_end_0 = const()[name = tensor<string, []>("op_1807_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 192])];
            tensor<bool, [4]> var_1807_end_mask_0 = const()[name = tensor<string, []>("op_1807_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1807_cast_fp16 = slice_by_index(begin = var_1807_begin_0, end = var_1807_end_0, end_mask = var_1807_end_mask_0, x = transpose_3)[name = tensor<string, []>("op_1807_cast_fp16")];
            tensor<int32, [4]> var_1811_begin_0 = const()[name = tensor<string, []>("op_1811_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 192])];
            tensor<int32, [4]> var_1811_end_0 = const()[name = tensor<string, []>("op_1811_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 256])];
            tensor<bool, [4]> var_1811_end_mask_0 = const()[name = tensor<string, []>("op_1811_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1811_cast_fp16 = slice_by_index(begin = var_1811_begin_0, end = var_1811_end_0, end_mask = var_1811_end_mask_0, x = transpose_3)[name = tensor<string, []>("op_1811_cast_fp16")];
            tensor<int32, [4]> var_1815_begin_0 = const()[name = tensor<string, []>("op_1815_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 256])];
            tensor<int32, [4]> var_1815_end_0 = const()[name = tensor<string, []>("op_1815_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 320])];
            tensor<bool, [4]> var_1815_end_mask_0 = const()[name = tensor<string, []>("op_1815_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1815_cast_fp16 = slice_by_index(begin = var_1815_begin_0, end = var_1815_end_0, end_mask = var_1815_end_mask_0, x = transpose_3)[name = tensor<string, []>("op_1815_cast_fp16")];
            tensor<int32, [4]> var_1819_begin_0 = const()[name = tensor<string, []>("op_1819_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 320])];
            tensor<int32, [4]> var_1819_end_0 = const()[name = tensor<string, []>("op_1819_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 384])];
            tensor<bool, [4]> var_1819_end_mask_0 = const()[name = tensor<string, []>("op_1819_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1819_cast_fp16 = slice_by_index(begin = var_1819_begin_0, end = var_1819_end_0, end_mask = var_1819_end_mask_0, x = transpose_3)[name = tensor<string, []>("op_1819_cast_fp16")];
            tensor<int32, [4]> var_1823_begin_0 = const()[name = tensor<string, []>("op_1823_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 384])];
            tensor<int32, [4]> var_1823_end_0 = const()[name = tensor<string, []>("op_1823_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 448])];
            tensor<bool, [4]> var_1823_end_mask_0 = const()[name = tensor<string, []>("op_1823_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1823_cast_fp16 = slice_by_index(begin = var_1823_begin_0, end = var_1823_end_0, end_mask = var_1823_end_mask_0, x = transpose_3)[name = tensor<string, []>("op_1823_cast_fp16")];
            tensor<int32, [4]> var_1827_begin_0 = const()[name = tensor<string, []>("op_1827_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 448])];
            tensor<int32, [4]> var_1827_end_0 = const()[name = tensor<string, []>("op_1827_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 512])];
            tensor<bool, [4]> var_1827_end_mask_0 = const()[name = tensor<string, []>("op_1827_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_1827_cast_fp16 = slice_by_index(begin = var_1827_begin_0, end = var_1827_end_0, end_mask = var_1827_end_mask_0, x = transpose_3)[name = tensor<string, []>("op_1827_cast_fp16")];
            tensor<int32, [4]> var_1829_begin_0 = const()[name = tensor<string, []>("op_1829_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_1829_end_0 = const()[name = tensor<string, []>("op_1829_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_1829_end_mask_0 = const()[name = tensor<string, []>("op_1829_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1829_cast_fp16 = slice_by_index(begin = var_1829_begin_0, end = var_1829_end_0, end_mask = var_1829_end_mask_0, x = value_5_cast_fp16)[name = tensor<string, []>("op_1829_cast_fp16")];
            tensor<int32, [4]> var_1833_begin_0 = const()[name = tensor<string, []>("op_1833_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_1833_end_0 = const()[name = tensor<string, []>("op_1833_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_1833_end_mask_0 = const()[name = tensor<string, []>("op_1833_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1833_cast_fp16 = slice_by_index(begin = var_1833_begin_0, end = var_1833_end_0, end_mask = var_1833_end_mask_0, x = value_5_cast_fp16)[name = tensor<string, []>("op_1833_cast_fp16")];
            tensor<int32, [4]> var_1837_begin_0 = const()[name = tensor<string, []>("op_1837_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_1837_end_0 = const()[name = tensor<string, []>("op_1837_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_1837_end_mask_0 = const()[name = tensor<string, []>("op_1837_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1837_cast_fp16 = slice_by_index(begin = var_1837_begin_0, end = var_1837_end_0, end_mask = var_1837_end_mask_0, x = value_5_cast_fp16)[name = tensor<string, []>("op_1837_cast_fp16")];
            tensor<int32, [4]> var_1841_begin_0 = const()[name = tensor<string, []>("op_1841_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_1841_end_0 = const()[name = tensor<string, []>("op_1841_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_1841_end_mask_0 = const()[name = tensor<string, []>("op_1841_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1841_cast_fp16 = slice_by_index(begin = var_1841_begin_0, end = var_1841_end_0, end_mask = var_1841_end_mask_0, x = value_5_cast_fp16)[name = tensor<string, []>("op_1841_cast_fp16")];
            tensor<int32, [4]> var_1845_begin_0 = const()[name = tensor<string, []>("op_1845_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_1845_end_0 = const()[name = tensor<string, []>("op_1845_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_1845_end_mask_0 = const()[name = tensor<string, []>("op_1845_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1845_cast_fp16 = slice_by_index(begin = var_1845_begin_0, end = var_1845_end_0, end_mask = var_1845_end_mask_0, x = value_5_cast_fp16)[name = tensor<string, []>("op_1845_cast_fp16")];
            tensor<int32, [4]> var_1849_begin_0 = const()[name = tensor<string, []>("op_1849_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_1849_end_0 = const()[name = tensor<string, []>("op_1849_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_1849_end_mask_0 = const()[name = tensor<string, []>("op_1849_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1849_cast_fp16 = slice_by_index(begin = var_1849_begin_0, end = var_1849_end_0, end_mask = var_1849_end_mask_0, x = value_5_cast_fp16)[name = tensor<string, []>("op_1849_cast_fp16")];
            tensor<int32, [4]> var_1853_begin_0 = const()[name = tensor<string, []>("op_1853_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_1853_end_0 = const()[name = tensor<string, []>("op_1853_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_1853_end_mask_0 = const()[name = tensor<string, []>("op_1853_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1853_cast_fp16 = slice_by_index(begin = var_1853_begin_0, end = var_1853_end_0, end_mask = var_1853_end_mask_0, x = value_5_cast_fp16)[name = tensor<string, []>("op_1853_cast_fp16")];
            tensor<int32, [4]> var_1857_begin_0 = const()[name = tensor<string, []>("op_1857_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_1857_end_0 = const()[name = tensor<string, []>("op_1857_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_1857_end_mask_0 = const()[name = tensor<string, []>("op_1857_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_1857_cast_fp16 = slice_by_index(begin = var_1857_begin_0, end = var_1857_end_0, end_mask = var_1857_end_mask_0, x = value_5_cast_fp16)[name = tensor<string, []>("op_1857_cast_fp16")];
            tensor<string, []> var_1861_equation_0 = const()[name = tensor<string, []>("op_1861_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1861_cast_fp16 = einsum(equation = var_1861_equation_0, values = (var_1799_cast_fp16, var_1577_cast_fp16))[name = tensor<string, []>("op_1861_cast_fp16")];
            tensor<fp16, []> var_1862_to_fp16 = const()[name = tensor<string, []>("op_1862_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_129_cast_fp16 = mul(x = var_1861_cast_fp16, y = var_1862_to_fp16)[name = tensor<string, []>("aw_chunk_129_cast_fp16")];
            tensor<string, []> var_1865_equation_0 = const()[name = tensor<string, []>("op_1865_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1865_cast_fp16 = einsum(equation = var_1865_equation_0, values = (var_1799_cast_fp16, var_1584_cast_fp16))[name = tensor<string, []>("op_1865_cast_fp16")];
            tensor<fp16, []> var_1866_to_fp16 = const()[name = tensor<string, []>("op_1866_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_131_cast_fp16 = mul(x = var_1865_cast_fp16, y = var_1866_to_fp16)[name = tensor<string, []>("aw_chunk_131_cast_fp16")];
            tensor<string, []> var_1869_equation_0 = const()[name = tensor<string, []>("op_1869_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1869_cast_fp16 = einsum(equation = var_1869_equation_0, values = (var_1799_cast_fp16, var_1591_cast_fp16))[name = tensor<string, []>("op_1869_cast_fp16")];
            tensor<fp16, []> var_1870_to_fp16 = const()[name = tensor<string, []>("op_1870_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_133_cast_fp16 = mul(x = var_1869_cast_fp16, y = var_1870_to_fp16)[name = tensor<string, []>("aw_chunk_133_cast_fp16")];
            tensor<string, []> var_1873_equation_0 = const()[name = tensor<string, []>("op_1873_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1873_cast_fp16 = einsum(equation = var_1873_equation_0, values = (var_1799_cast_fp16, var_1598_cast_fp16))[name = tensor<string, []>("op_1873_cast_fp16")];
            tensor<fp16, []> var_1874_to_fp16 = const()[name = tensor<string, []>("op_1874_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_135_cast_fp16 = mul(x = var_1873_cast_fp16, y = var_1874_to_fp16)[name = tensor<string, []>("aw_chunk_135_cast_fp16")];
            tensor<string, []> var_1877_equation_0 = const()[name = tensor<string, []>("op_1877_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1877_cast_fp16 = einsum(equation = var_1877_equation_0, values = (var_1803_cast_fp16, var_1605_cast_fp16))[name = tensor<string, []>("op_1877_cast_fp16")];
            tensor<fp16, []> var_1878_to_fp16 = const()[name = tensor<string, []>("op_1878_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_137_cast_fp16 = mul(x = var_1877_cast_fp16, y = var_1878_to_fp16)[name = tensor<string, []>("aw_chunk_137_cast_fp16")];
            tensor<string, []> var_1881_equation_0 = const()[name = tensor<string, []>("op_1881_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1881_cast_fp16 = einsum(equation = var_1881_equation_0, values = (var_1803_cast_fp16, var_1612_cast_fp16))[name = tensor<string, []>("op_1881_cast_fp16")];
            tensor<fp16, []> var_1882_to_fp16 = const()[name = tensor<string, []>("op_1882_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_139_cast_fp16 = mul(x = var_1881_cast_fp16, y = var_1882_to_fp16)[name = tensor<string, []>("aw_chunk_139_cast_fp16")];
            tensor<string, []> var_1885_equation_0 = const()[name = tensor<string, []>("op_1885_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1885_cast_fp16 = einsum(equation = var_1885_equation_0, values = (var_1803_cast_fp16, var_1619_cast_fp16))[name = tensor<string, []>("op_1885_cast_fp16")];
            tensor<fp16, []> var_1886_to_fp16 = const()[name = tensor<string, []>("op_1886_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_141_cast_fp16 = mul(x = var_1885_cast_fp16, y = var_1886_to_fp16)[name = tensor<string, []>("aw_chunk_141_cast_fp16")];
            tensor<string, []> var_1889_equation_0 = const()[name = tensor<string, []>("op_1889_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1889_cast_fp16 = einsum(equation = var_1889_equation_0, values = (var_1803_cast_fp16, var_1626_cast_fp16))[name = tensor<string, []>("op_1889_cast_fp16")];
            tensor<fp16, []> var_1890_to_fp16 = const()[name = tensor<string, []>("op_1890_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_143_cast_fp16 = mul(x = var_1889_cast_fp16, y = var_1890_to_fp16)[name = tensor<string, []>("aw_chunk_143_cast_fp16")];
            tensor<string, []> var_1893_equation_0 = const()[name = tensor<string, []>("op_1893_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1893_cast_fp16 = einsum(equation = var_1893_equation_0, values = (var_1807_cast_fp16, var_1633_cast_fp16))[name = tensor<string, []>("op_1893_cast_fp16")];
            tensor<fp16, []> var_1894_to_fp16 = const()[name = tensor<string, []>("op_1894_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_145_cast_fp16 = mul(x = var_1893_cast_fp16, y = var_1894_to_fp16)[name = tensor<string, []>("aw_chunk_145_cast_fp16")];
            tensor<string, []> var_1897_equation_0 = const()[name = tensor<string, []>("op_1897_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1897_cast_fp16 = einsum(equation = var_1897_equation_0, values = (var_1807_cast_fp16, var_1640_cast_fp16))[name = tensor<string, []>("op_1897_cast_fp16")];
            tensor<fp16, []> var_1898_to_fp16 = const()[name = tensor<string, []>("op_1898_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_147_cast_fp16 = mul(x = var_1897_cast_fp16, y = var_1898_to_fp16)[name = tensor<string, []>("aw_chunk_147_cast_fp16")];
            tensor<string, []> var_1901_equation_0 = const()[name = tensor<string, []>("op_1901_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1901_cast_fp16 = einsum(equation = var_1901_equation_0, values = (var_1807_cast_fp16, var_1647_cast_fp16))[name = tensor<string, []>("op_1901_cast_fp16")];
            tensor<fp16, []> var_1902_to_fp16 = const()[name = tensor<string, []>("op_1902_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_149_cast_fp16 = mul(x = var_1901_cast_fp16, y = var_1902_to_fp16)[name = tensor<string, []>("aw_chunk_149_cast_fp16")];
            tensor<string, []> var_1905_equation_0 = const()[name = tensor<string, []>("op_1905_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1905_cast_fp16 = einsum(equation = var_1905_equation_0, values = (var_1807_cast_fp16, var_1654_cast_fp16))[name = tensor<string, []>("op_1905_cast_fp16")];
            tensor<fp16, []> var_1906_to_fp16 = const()[name = tensor<string, []>("op_1906_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_151_cast_fp16 = mul(x = var_1905_cast_fp16, y = var_1906_to_fp16)[name = tensor<string, []>("aw_chunk_151_cast_fp16")];
            tensor<string, []> var_1909_equation_0 = const()[name = tensor<string, []>("op_1909_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1909_cast_fp16 = einsum(equation = var_1909_equation_0, values = (var_1811_cast_fp16, var_1661_cast_fp16))[name = tensor<string, []>("op_1909_cast_fp16")];
            tensor<fp16, []> var_1910_to_fp16 = const()[name = tensor<string, []>("op_1910_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_153_cast_fp16 = mul(x = var_1909_cast_fp16, y = var_1910_to_fp16)[name = tensor<string, []>("aw_chunk_153_cast_fp16")];
            tensor<string, []> var_1913_equation_0 = const()[name = tensor<string, []>("op_1913_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1913_cast_fp16 = einsum(equation = var_1913_equation_0, values = (var_1811_cast_fp16, var_1668_cast_fp16))[name = tensor<string, []>("op_1913_cast_fp16")];
            tensor<fp16, []> var_1914_to_fp16 = const()[name = tensor<string, []>("op_1914_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_155_cast_fp16 = mul(x = var_1913_cast_fp16, y = var_1914_to_fp16)[name = tensor<string, []>("aw_chunk_155_cast_fp16")];
            tensor<string, []> var_1917_equation_0 = const()[name = tensor<string, []>("op_1917_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1917_cast_fp16 = einsum(equation = var_1917_equation_0, values = (var_1811_cast_fp16, var_1675_cast_fp16))[name = tensor<string, []>("op_1917_cast_fp16")];
            tensor<fp16, []> var_1918_to_fp16 = const()[name = tensor<string, []>("op_1918_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_157_cast_fp16 = mul(x = var_1917_cast_fp16, y = var_1918_to_fp16)[name = tensor<string, []>("aw_chunk_157_cast_fp16")];
            tensor<string, []> var_1921_equation_0 = const()[name = tensor<string, []>("op_1921_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1921_cast_fp16 = einsum(equation = var_1921_equation_0, values = (var_1811_cast_fp16, var_1682_cast_fp16))[name = tensor<string, []>("op_1921_cast_fp16")];
            tensor<fp16, []> var_1922_to_fp16 = const()[name = tensor<string, []>("op_1922_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_159_cast_fp16 = mul(x = var_1921_cast_fp16, y = var_1922_to_fp16)[name = tensor<string, []>("aw_chunk_159_cast_fp16")];
            tensor<string, []> var_1925_equation_0 = const()[name = tensor<string, []>("op_1925_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1925_cast_fp16 = einsum(equation = var_1925_equation_0, values = (var_1815_cast_fp16, var_1689_cast_fp16))[name = tensor<string, []>("op_1925_cast_fp16")];
            tensor<fp16, []> var_1926_to_fp16 = const()[name = tensor<string, []>("op_1926_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_161_cast_fp16 = mul(x = var_1925_cast_fp16, y = var_1926_to_fp16)[name = tensor<string, []>("aw_chunk_161_cast_fp16")];
            tensor<string, []> var_1929_equation_0 = const()[name = tensor<string, []>("op_1929_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1929_cast_fp16 = einsum(equation = var_1929_equation_0, values = (var_1815_cast_fp16, var_1696_cast_fp16))[name = tensor<string, []>("op_1929_cast_fp16")];
            tensor<fp16, []> var_1930_to_fp16 = const()[name = tensor<string, []>("op_1930_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_163_cast_fp16 = mul(x = var_1929_cast_fp16, y = var_1930_to_fp16)[name = tensor<string, []>("aw_chunk_163_cast_fp16")];
            tensor<string, []> var_1933_equation_0 = const()[name = tensor<string, []>("op_1933_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1933_cast_fp16 = einsum(equation = var_1933_equation_0, values = (var_1815_cast_fp16, var_1703_cast_fp16))[name = tensor<string, []>("op_1933_cast_fp16")];
            tensor<fp16, []> var_1934_to_fp16 = const()[name = tensor<string, []>("op_1934_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_165_cast_fp16 = mul(x = var_1933_cast_fp16, y = var_1934_to_fp16)[name = tensor<string, []>("aw_chunk_165_cast_fp16")];
            tensor<string, []> var_1937_equation_0 = const()[name = tensor<string, []>("op_1937_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1937_cast_fp16 = einsum(equation = var_1937_equation_0, values = (var_1815_cast_fp16, var_1710_cast_fp16))[name = tensor<string, []>("op_1937_cast_fp16")];
            tensor<fp16, []> var_1938_to_fp16 = const()[name = tensor<string, []>("op_1938_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_167_cast_fp16 = mul(x = var_1937_cast_fp16, y = var_1938_to_fp16)[name = tensor<string, []>("aw_chunk_167_cast_fp16")];
            tensor<string, []> var_1941_equation_0 = const()[name = tensor<string, []>("op_1941_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1941_cast_fp16 = einsum(equation = var_1941_equation_0, values = (var_1819_cast_fp16, var_1717_cast_fp16))[name = tensor<string, []>("op_1941_cast_fp16")];
            tensor<fp16, []> var_1942_to_fp16 = const()[name = tensor<string, []>("op_1942_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_169_cast_fp16 = mul(x = var_1941_cast_fp16, y = var_1942_to_fp16)[name = tensor<string, []>("aw_chunk_169_cast_fp16")];
            tensor<string, []> var_1945_equation_0 = const()[name = tensor<string, []>("op_1945_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1945_cast_fp16 = einsum(equation = var_1945_equation_0, values = (var_1819_cast_fp16, var_1724_cast_fp16))[name = tensor<string, []>("op_1945_cast_fp16")];
            tensor<fp16, []> var_1946_to_fp16 = const()[name = tensor<string, []>("op_1946_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_171_cast_fp16 = mul(x = var_1945_cast_fp16, y = var_1946_to_fp16)[name = tensor<string, []>("aw_chunk_171_cast_fp16")];
            tensor<string, []> var_1949_equation_0 = const()[name = tensor<string, []>("op_1949_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1949_cast_fp16 = einsum(equation = var_1949_equation_0, values = (var_1819_cast_fp16, var_1731_cast_fp16))[name = tensor<string, []>("op_1949_cast_fp16")];
            tensor<fp16, []> var_1950_to_fp16 = const()[name = tensor<string, []>("op_1950_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_173_cast_fp16 = mul(x = var_1949_cast_fp16, y = var_1950_to_fp16)[name = tensor<string, []>("aw_chunk_173_cast_fp16")];
            tensor<string, []> var_1953_equation_0 = const()[name = tensor<string, []>("op_1953_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1953_cast_fp16 = einsum(equation = var_1953_equation_0, values = (var_1819_cast_fp16, var_1738_cast_fp16))[name = tensor<string, []>("op_1953_cast_fp16")];
            tensor<fp16, []> var_1954_to_fp16 = const()[name = tensor<string, []>("op_1954_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_175_cast_fp16 = mul(x = var_1953_cast_fp16, y = var_1954_to_fp16)[name = tensor<string, []>("aw_chunk_175_cast_fp16")];
            tensor<string, []> var_1957_equation_0 = const()[name = tensor<string, []>("op_1957_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1957_cast_fp16 = einsum(equation = var_1957_equation_0, values = (var_1823_cast_fp16, var_1745_cast_fp16))[name = tensor<string, []>("op_1957_cast_fp16")];
            tensor<fp16, []> var_1958_to_fp16 = const()[name = tensor<string, []>("op_1958_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_177_cast_fp16 = mul(x = var_1957_cast_fp16, y = var_1958_to_fp16)[name = tensor<string, []>("aw_chunk_177_cast_fp16")];
            tensor<string, []> var_1961_equation_0 = const()[name = tensor<string, []>("op_1961_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1961_cast_fp16 = einsum(equation = var_1961_equation_0, values = (var_1823_cast_fp16, var_1752_cast_fp16))[name = tensor<string, []>("op_1961_cast_fp16")];
            tensor<fp16, []> var_1962_to_fp16 = const()[name = tensor<string, []>("op_1962_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_179_cast_fp16 = mul(x = var_1961_cast_fp16, y = var_1962_to_fp16)[name = tensor<string, []>("aw_chunk_179_cast_fp16")];
            tensor<string, []> var_1965_equation_0 = const()[name = tensor<string, []>("op_1965_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1965_cast_fp16 = einsum(equation = var_1965_equation_0, values = (var_1823_cast_fp16, var_1759_cast_fp16))[name = tensor<string, []>("op_1965_cast_fp16")];
            tensor<fp16, []> var_1966_to_fp16 = const()[name = tensor<string, []>("op_1966_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_181_cast_fp16 = mul(x = var_1965_cast_fp16, y = var_1966_to_fp16)[name = tensor<string, []>("aw_chunk_181_cast_fp16")];
            tensor<string, []> var_1969_equation_0 = const()[name = tensor<string, []>("op_1969_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1969_cast_fp16 = einsum(equation = var_1969_equation_0, values = (var_1823_cast_fp16, var_1766_cast_fp16))[name = tensor<string, []>("op_1969_cast_fp16")];
            tensor<fp16, []> var_1970_to_fp16 = const()[name = tensor<string, []>("op_1970_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_183_cast_fp16 = mul(x = var_1969_cast_fp16, y = var_1970_to_fp16)[name = tensor<string, []>("aw_chunk_183_cast_fp16")];
            tensor<string, []> var_1973_equation_0 = const()[name = tensor<string, []>("op_1973_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1973_cast_fp16 = einsum(equation = var_1973_equation_0, values = (var_1827_cast_fp16, var_1773_cast_fp16))[name = tensor<string, []>("op_1973_cast_fp16")];
            tensor<fp16, []> var_1974_to_fp16 = const()[name = tensor<string, []>("op_1974_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_185_cast_fp16 = mul(x = var_1973_cast_fp16, y = var_1974_to_fp16)[name = tensor<string, []>("aw_chunk_185_cast_fp16")];
            tensor<string, []> var_1977_equation_0 = const()[name = tensor<string, []>("op_1977_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1977_cast_fp16 = einsum(equation = var_1977_equation_0, values = (var_1827_cast_fp16, var_1780_cast_fp16))[name = tensor<string, []>("op_1977_cast_fp16")];
            tensor<fp16, []> var_1978_to_fp16 = const()[name = tensor<string, []>("op_1978_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_187_cast_fp16 = mul(x = var_1977_cast_fp16, y = var_1978_to_fp16)[name = tensor<string, []>("aw_chunk_187_cast_fp16")];
            tensor<string, []> var_1981_equation_0 = const()[name = tensor<string, []>("op_1981_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1981_cast_fp16 = einsum(equation = var_1981_equation_0, values = (var_1827_cast_fp16, var_1787_cast_fp16))[name = tensor<string, []>("op_1981_cast_fp16")];
            tensor<fp16, []> var_1982_to_fp16 = const()[name = tensor<string, []>("op_1982_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_189_cast_fp16 = mul(x = var_1981_cast_fp16, y = var_1982_to_fp16)[name = tensor<string, []>("aw_chunk_189_cast_fp16")];
            tensor<string, []> var_1985_equation_0 = const()[name = tensor<string, []>("op_1985_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_1985_cast_fp16 = einsum(equation = var_1985_equation_0, values = (var_1827_cast_fp16, var_1794_cast_fp16))[name = tensor<string, []>("op_1985_cast_fp16")];
            tensor<fp16, []> var_1986_to_fp16 = const()[name = tensor<string, []>("op_1986_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_191_cast_fp16 = mul(x = var_1985_cast_fp16, y = var_1986_to_fp16)[name = tensor<string, []>("aw_chunk_191_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1988_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_129_cast_fp16)[name = tensor<string, []>("op_1988_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1989_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_131_cast_fp16)[name = tensor<string, []>("op_1989_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1990_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_133_cast_fp16)[name = tensor<string, []>("op_1990_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1991_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_135_cast_fp16)[name = tensor<string, []>("op_1991_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1992_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_137_cast_fp16)[name = tensor<string, []>("op_1992_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1993_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_139_cast_fp16)[name = tensor<string, []>("op_1993_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1994_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_141_cast_fp16)[name = tensor<string, []>("op_1994_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1995_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_143_cast_fp16)[name = tensor<string, []>("op_1995_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1996_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_145_cast_fp16)[name = tensor<string, []>("op_1996_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1997_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_147_cast_fp16)[name = tensor<string, []>("op_1997_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1998_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_149_cast_fp16)[name = tensor<string, []>("op_1998_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_1999_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_151_cast_fp16)[name = tensor<string, []>("op_1999_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2000_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_153_cast_fp16)[name = tensor<string, []>("op_2000_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2001_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_155_cast_fp16)[name = tensor<string, []>("op_2001_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2002_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_157_cast_fp16)[name = tensor<string, []>("op_2002_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2003_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_159_cast_fp16)[name = tensor<string, []>("op_2003_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2004_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_161_cast_fp16)[name = tensor<string, []>("op_2004_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2005_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_163_cast_fp16)[name = tensor<string, []>("op_2005_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2006_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_165_cast_fp16)[name = tensor<string, []>("op_2006_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2007_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_167_cast_fp16)[name = tensor<string, []>("op_2007_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2008_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_169_cast_fp16)[name = tensor<string, []>("op_2008_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2009_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_171_cast_fp16)[name = tensor<string, []>("op_2009_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2010_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_173_cast_fp16)[name = tensor<string, []>("op_2010_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2011_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_175_cast_fp16)[name = tensor<string, []>("op_2011_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2012_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_177_cast_fp16)[name = tensor<string, []>("op_2012_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2013_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_179_cast_fp16)[name = tensor<string, []>("op_2013_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2014_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_181_cast_fp16)[name = tensor<string, []>("op_2014_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2015_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_183_cast_fp16)[name = tensor<string, []>("op_2015_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2016_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_185_cast_fp16)[name = tensor<string, []>("op_2016_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2017_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_187_cast_fp16)[name = tensor<string, []>("op_2017_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2018_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_189_cast_fp16)[name = tensor<string, []>("op_2018_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2019_cast_fp16 = softmax(axis = var_1485, x = aw_chunk_191_cast_fp16)[name = tensor<string, []>("op_2019_cast_fp16")];
            tensor<string, []> var_2021_equation_0 = const()[name = tensor<string, []>("op_2021_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2021_cast_fp16 = einsum(equation = var_2021_equation_0, values = (var_1829_cast_fp16, var_1988_cast_fp16))[name = tensor<string, []>("op_2021_cast_fp16")];
            tensor<string, []> var_2023_equation_0 = const()[name = tensor<string, []>("op_2023_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2023_cast_fp16 = einsum(equation = var_2023_equation_0, values = (var_1829_cast_fp16, var_1989_cast_fp16))[name = tensor<string, []>("op_2023_cast_fp16")];
            tensor<string, []> var_2025_equation_0 = const()[name = tensor<string, []>("op_2025_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2025_cast_fp16 = einsum(equation = var_2025_equation_0, values = (var_1829_cast_fp16, var_1990_cast_fp16))[name = tensor<string, []>("op_2025_cast_fp16")];
            tensor<string, []> var_2027_equation_0 = const()[name = tensor<string, []>("op_2027_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2027_cast_fp16 = einsum(equation = var_2027_equation_0, values = (var_1829_cast_fp16, var_1991_cast_fp16))[name = tensor<string, []>("op_2027_cast_fp16")];
            tensor<string, []> var_2029_equation_0 = const()[name = tensor<string, []>("op_2029_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2029_cast_fp16 = einsum(equation = var_2029_equation_0, values = (var_1833_cast_fp16, var_1992_cast_fp16))[name = tensor<string, []>("op_2029_cast_fp16")];
            tensor<string, []> var_2031_equation_0 = const()[name = tensor<string, []>("op_2031_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2031_cast_fp16 = einsum(equation = var_2031_equation_0, values = (var_1833_cast_fp16, var_1993_cast_fp16))[name = tensor<string, []>("op_2031_cast_fp16")];
            tensor<string, []> var_2033_equation_0 = const()[name = tensor<string, []>("op_2033_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2033_cast_fp16 = einsum(equation = var_2033_equation_0, values = (var_1833_cast_fp16, var_1994_cast_fp16))[name = tensor<string, []>("op_2033_cast_fp16")];
            tensor<string, []> var_2035_equation_0 = const()[name = tensor<string, []>("op_2035_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2035_cast_fp16 = einsum(equation = var_2035_equation_0, values = (var_1833_cast_fp16, var_1995_cast_fp16))[name = tensor<string, []>("op_2035_cast_fp16")];
            tensor<string, []> var_2037_equation_0 = const()[name = tensor<string, []>("op_2037_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2037_cast_fp16 = einsum(equation = var_2037_equation_0, values = (var_1837_cast_fp16, var_1996_cast_fp16))[name = tensor<string, []>("op_2037_cast_fp16")];
            tensor<string, []> var_2039_equation_0 = const()[name = tensor<string, []>("op_2039_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2039_cast_fp16 = einsum(equation = var_2039_equation_0, values = (var_1837_cast_fp16, var_1997_cast_fp16))[name = tensor<string, []>("op_2039_cast_fp16")];
            tensor<string, []> var_2041_equation_0 = const()[name = tensor<string, []>("op_2041_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2041_cast_fp16 = einsum(equation = var_2041_equation_0, values = (var_1837_cast_fp16, var_1998_cast_fp16))[name = tensor<string, []>("op_2041_cast_fp16")];
            tensor<string, []> var_2043_equation_0 = const()[name = tensor<string, []>("op_2043_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2043_cast_fp16 = einsum(equation = var_2043_equation_0, values = (var_1837_cast_fp16, var_1999_cast_fp16))[name = tensor<string, []>("op_2043_cast_fp16")];
            tensor<string, []> var_2045_equation_0 = const()[name = tensor<string, []>("op_2045_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2045_cast_fp16 = einsum(equation = var_2045_equation_0, values = (var_1841_cast_fp16, var_2000_cast_fp16))[name = tensor<string, []>("op_2045_cast_fp16")];
            tensor<string, []> var_2047_equation_0 = const()[name = tensor<string, []>("op_2047_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2047_cast_fp16 = einsum(equation = var_2047_equation_0, values = (var_1841_cast_fp16, var_2001_cast_fp16))[name = tensor<string, []>("op_2047_cast_fp16")];
            tensor<string, []> var_2049_equation_0 = const()[name = tensor<string, []>("op_2049_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2049_cast_fp16 = einsum(equation = var_2049_equation_0, values = (var_1841_cast_fp16, var_2002_cast_fp16))[name = tensor<string, []>("op_2049_cast_fp16")];
            tensor<string, []> var_2051_equation_0 = const()[name = tensor<string, []>("op_2051_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2051_cast_fp16 = einsum(equation = var_2051_equation_0, values = (var_1841_cast_fp16, var_2003_cast_fp16))[name = tensor<string, []>("op_2051_cast_fp16")];
            tensor<string, []> var_2053_equation_0 = const()[name = tensor<string, []>("op_2053_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2053_cast_fp16 = einsum(equation = var_2053_equation_0, values = (var_1845_cast_fp16, var_2004_cast_fp16))[name = tensor<string, []>("op_2053_cast_fp16")];
            tensor<string, []> var_2055_equation_0 = const()[name = tensor<string, []>("op_2055_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2055_cast_fp16 = einsum(equation = var_2055_equation_0, values = (var_1845_cast_fp16, var_2005_cast_fp16))[name = tensor<string, []>("op_2055_cast_fp16")];
            tensor<string, []> var_2057_equation_0 = const()[name = tensor<string, []>("op_2057_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2057_cast_fp16 = einsum(equation = var_2057_equation_0, values = (var_1845_cast_fp16, var_2006_cast_fp16))[name = tensor<string, []>("op_2057_cast_fp16")];
            tensor<string, []> var_2059_equation_0 = const()[name = tensor<string, []>("op_2059_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2059_cast_fp16 = einsum(equation = var_2059_equation_0, values = (var_1845_cast_fp16, var_2007_cast_fp16))[name = tensor<string, []>("op_2059_cast_fp16")];
            tensor<string, []> var_2061_equation_0 = const()[name = tensor<string, []>("op_2061_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2061_cast_fp16 = einsum(equation = var_2061_equation_0, values = (var_1849_cast_fp16, var_2008_cast_fp16))[name = tensor<string, []>("op_2061_cast_fp16")];
            tensor<string, []> var_2063_equation_0 = const()[name = tensor<string, []>("op_2063_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2063_cast_fp16 = einsum(equation = var_2063_equation_0, values = (var_1849_cast_fp16, var_2009_cast_fp16))[name = tensor<string, []>("op_2063_cast_fp16")];
            tensor<string, []> var_2065_equation_0 = const()[name = tensor<string, []>("op_2065_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2065_cast_fp16 = einsum(equation = var_2065_equation_0, values = (var_1849_cast_fp16, var_2010_cast_fp16))[name = tensor<string, []>("op_2065_cast_fp16")];
            tensor<string, []> var_2067_equation_0 = const()[name = tensor<string, []>("op_2067_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2067_cast_fp16 = einsum(equation = var_2067_equation_0, values = (var_1849_cast_fp16, var_2011_cast_fp16))[name = tensor<string, []>("op_2067_cast_fp16")];
            tensor<string, []> var_2069_equation_0 = const()[name = tensor<string, []>("op_2069_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2069_cast_fp16 = einsum(equation = var_2069_equation_0, values = (var_1853_cast_fp16, var_2012_cast_fp16))[name = tensor<string, []>("op_2069_cast_fp16")];
            tensor<string, []> var_2071_equation_0 = const()[name = tensor<string, []>("op_2071_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2071_cast_fp16 = einsum(equation = var_2071_equation_0, values = (var_1853_cast_fp16, var_2013_cast_fp16))[name = tensor<string, []>("op_2071_cast_fp16")];
            tensor<string, []> var_2073_equation_0 = const()[name = tensor<string, []>("op_2073_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2073_cast_fp16 = einsum(equation = var_2073_equation_0, values = (var_1853_cast_fp16, var_2014_cast_fp16))[name = tensor<string, []>("op_2073_cast_fp16")];
            tensor<string, []> var_2075_equation_0 = const()[name = tensor<string, []>("op_2075_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2075_cast_fp16 = einsum(equation = var_2075_equation_0, values = (var_1853_cast_fp16, var_2015_cast_fp16))[name = tensor<string, []>("op_2075_cast_fp16")];
            tensor<string, []> var_2077_equation_0 = const()[name = tensor<string, []>("op_2077_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2077_cast_fp16 = einsum(equation = var_2077_equation_0, values = (var_1857_cast_fp16, var_2016_cast_fp16))[name = tensor<string, []>("op_2077_cast_fp16")];
            tensor<string, []> var_2079_equation_0 = const()[name = tensor<string, []>("op_2079_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2079_cast_fp16 = einsum(equation = var_2079_equation_0, values = (var_1857_cast_fp16, var_2017_cast_fp16))[name = tensor<string, []>("op_2079_cast_fp16")];
            tensor<string, []> var_2081_equation_0 = const()[name = tensor<string, []>("op_2081_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2081_cast_fp16 = einsum(equation = var_2081_equation_0, values = (var_1857_cast_fp16, var_2018_cast_fp16))[name = tensor<string, []>("op_2081_cast_fp16")];
            tensor<string, []> var_2083_equation_0 = const()[name = tensor<string, []>("op_2083_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2083_cast_fp16 = einsum(equation = var_2083_equation_0, values = (var_1857_cast_fp16, var_2019_cast_fp16))[name = tensor<string, []>("op_2083_cast_fp16")];
            tensor<bool, []> var_2085_interleave_0 = const()[name = tensor<string, []>("op_2085_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2085_cast_fp16 = concat(axis = var_1472, interleave = var_2085_interleave_0, values = (var_2021_cast_fp16, var_2023_cast_fp16, var_2025_cast_fp16, var_2027_cast_fp16))[name = tensor<string, []>("op_2085_cast_fp16")];
            tensor<bool, []> var_2087_interleave_0 = const()[name = tensor<string, []>("op_2087_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2087_cast_fp16 = concat(axis = var_1472, interleave = var_2087_interleave_0, values = (var_2029_cast_fp16, var_2031_cast_fp16, var_2033_cast_fp16, var_2035_cast_fp16))[name = tensor<string, []>("op_2087_cast_fp16")];
            tensor<bool, []> var_2089_interleave_0 = const()[name = tensor<string, []>("op_2089_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2089_cast_fp16 = concat(axis = var_1472, interleave = var_2089_interleave_0, values = (var_2037_cast_fp16, var_2039_cast_fp16, var_2041_cast_fp16, var_2043_cast_fp16))[name = tensor<string, []>("op_2089_cast_fp16")];
            tensor<bool, []> var_2091_interleave_0 = const()[name = tensor<string, []>("op_2091_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2091_cast_fp16 = concat(axis = var_1472, interleave = var_2091_interleave_0, values = (var_2045_cast_fp16, var_2047_cast_fp16, var_2049_cast_fp16, var_2051_cast_fp16))[name = tensor<string, []>("op_2091_cast_fp16")];
            tensor<bool, []> var_2093_interleave_0 = const()[name = tensor<string, []>("op_2093_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2093_cast_fp16 = concat(axis = var_1472, interleave = var_2093_interleave_0, values = (var_2053_cast_fp16, var_2055_cast_fp16, var_2057_cast_fp16, var_2059_cast_fp16))[name = tensor<string, []>("op_2093_cast_fp16")];
            tensor<bool, []> var_2095_interleave_0 = const()[name = tensor<string, []>("op_2095_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2095_cast_fp16 = concat(axis = var_1472, interleave = var_2095_interleave_0, values = (var_2061_cast_fp16, var_2063_cast_fp16, var_2065_cast_fp16, var_2067_cast_fp16))[name = tensor<string, []>("op_2095_cast_fp16")];
            tensor<bool, []> var_2097_interleave_0 = const()[name = tensor<string, []>("op_2097_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2097_cast_fp16 = concat(axis = var_1472, interleave = var_2097_interleave_0, values = (var_2069_cast_fp16, var_2071_cast_fp16, var_2073_cast_fp16, var_2075_cast_fp16))[name = tensor<string, []>("op_2097_cast_fp16")];
            tensor<bool, []> var_2099_interleave_0 = const()[name = tensor<string, []>("op_2099_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2099_cast_fp16 = concat(axis = var_1472, interleave = var_2099_interleave_0, values = (var_2077_cast_fp16, var_2079_cast_fp16, var_2081_cast_fp16, var_2083_cast_fp16))[name = tensor<string, []>("op_2099_cast_fp16")];
            tensor<bool, []> input_17_interleave_0 = const()[name = tensor<string, []>("input_17_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 512, 1, 1500]> input_17_cast_fp16 = concat(axis = var_1485, interleave = input_17_interleave_0, values = (var_2085_cast_fp16, var_2087_cast_fp16, var_2089_cast_fp16, var_2091_cast_fp16, var_2093_cast_fp16, var_2095_cast_fp16, var_2097_cast_fp16, var_2099_cast_fp16))[name = tensor<string, []>("input_17_cast_fp16")];
            tensor<int32, [2]> var_2104 = const()[name = tensor<string, []>("op_2104"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2106 = const()[name = tensor<string, []>("op_2106"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_11_pad_type_0 = const()[name = tensor<string, []>("obj_11_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_11_pad_0 = const()[name = tensor<string, []>("obj_11_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_2_self_attn_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_o_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(17546048)))];
            tensor<fp16, [512]> layers_2_self_attn_o_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_self_attn_o_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(18070400)))];
            tensor<fp16, [1, 512, 1, 1500]> obj_11_cast_fp16 = conv(bias = layers_2_self_attn_o_proj_bias_to_fp16, dilations = var_2106, groups = var_1485, pad = obj_11_pad_0, pad_type = obj_11_pad_type_0, strides = var_2104, weight = layers_2_self_attn_o_proj_weight_to_fp16, x = input_17_cast_fp16)[name = tensor<string, []>("obj_11_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_11_cast_fp16 = add(x = inputs_9_cast_fp16, y = obj_11_cast_fp16)[name = tensor<string, []>("inputs_11_cast_fp16")];
            tensor<int32, [1]> var_2112 = const()[name = tensor<string, []>("op_2112"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_11_cast_fp16 = reduce_mean(axes = var_2112, keep_dims = var_1486, x = inputs_11_cast_fp16)[name = tensor<string, []>("channels_mean_11_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_11_cast_fp16 = sub(x = inputs_11_cast_fp16, y = channels_mean_11_cast_fp16)[name = tensor<string, []>("zero_mean_11_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_11_cast_fp16 = mul(x = zero_mean_11_cast_fp16, y = zero_mean_11_cast_fp16)[name = tensor<string, []>("zero_mean_sq_11_cast_fp16")];
            tensor<int32, [1]> var_2116 = const()[name = tensor<string, []>("op_2116"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_2117_cast_fp16 = reduce_mean(axes = var_2116, keep_dims = var_1486, x = zero_mean_sq_11_cast_fp16)[name = tensor<string, []>("op_2117_cast_fp16")];
            tensor<fp16, []> var_2118_to_fp16 = const()[name = tensor<string, []>("op_2118_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_2119_cast_fp16 = add(x = var_2117_cast_fp16, y = var_2118_to_fp16)[name = tensor<string, []>("op_2119_cast_fp16")];
            tensor<fp16, []> denom_11_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_11_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_11_cast_fp16 = rsqrt(epsilon = denom_11_epsilon_0_to_fp16, x = var_2119_cast_fp16)[name = tensor<string, []>("denom_11_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_11_cast_fp16 = mul(x = zero_mean_11_cast_fp16, y = denom_11_cast_fp16)[name = tensor<string, []>("out_11_cast_fp16")];
            tensor<fp16, [512]> input_19_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_19_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(18071488)))];
            tensor<fp16, [512]> input_19_beta_0_to_fp16 = const()[name = tensor<string, []>("input_19_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(18072576)))];
            tensor<fp16, []> input_19_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_19_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> input_19_cast_fp16 = batch_norm(beta = input_19_beta_0_to_fp16, epsilon = input_19_epsilon_0_to_fp16, gamma = input_19_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_11_cast_fp16)[name = tensor<string, []>("input_19_cast_fp16")];
            tensor<int32, [2]> var_2130 = const()[name = tensor<string, []>("op_2130"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2132 = const()[name = tensor<string, []>("op_2132"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> input_21_pad_type_0 = const()[name = tensor<string, []>("input_21_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> input_21_pad_0 = const()[name = tensor<string, []>("input_21_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [2048, 512, 1, 1]> layers_2_fc1_weight_to_fp16 = const()[name = tensor<string, []>("layers_2_fc1_weight_to_fp16"), val = tensor<fp16, [2048, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(18073664)))];
            tensor<fp16, [2048]> layers_2_fc1_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_fc1_bias_to_fp16"), val = tensor<fp16, [2048]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20170880)))];
            tensor<fp16, [1, 2048, 1, 1500]> input_21_cast_fp16 = conv(bias = layers_2_fc1_bias_to_fp16, dilations = var_2132, groups = var_1485, pad = input_21_pad_0, pad_type = input_21_pad_type_0, strides = var_2130, weight = layers_2_fc1_weight_to_fp16, x = input_19_cast_fp16)[name = tensor<string, []>("input_21_cast_fp16")];
            tensor<string, []> input_23_mode_0 = const()[name = tensor<string, []>("input_23_mode_0"), val = tensor<string, []>("EXACT")];
            tensor<fp16, [1, 2048, 1, 1500]> input_23_cast_fp16 = gelu(mode = input_23_mode_0, x = input_21_cast_fp16)[name = tensor<string, []>("input_23_cast_fp16")];
            tensor<int32, [2]> var_2138 = const()[name = tensor<string, []>("op_2138"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2140 = const()[name = tensor<string, []>("op_2140"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> hidden_states_9_pad_type_0 = const()[name = tensor<string, []>("hidden_states_9_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> hidden_states_9_pad_0 = const()[name = tensor<string, []>("hidden_states_9_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 2048, 1, 1]> layers_2_fc2_weight_to_fp16 = const()[name = tensor<string, []>("layers_2_fc2_weight_to_fp16"), val = tensor<fp16, [512, 2048, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(20175040)))];
            tensor<fp16, [512]> layers_2_fc2_bias_to_fp16 = const()[name = tensor<string, []>("layers_2_fc2_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22272256)))];
            tensor<fp16, [1, 512, 1, 1500]> hidden_states_9_cast_fp16 = conv(bias = layers_2_fc2_bias_to_fp16, dilations = var_2140, groups = var_1485, pad = hidden_states_9_pad_0, pad_type = hidden_states_9_pad_type_0, strides = var_2138, weight = layers_2_fc2_weight_to_fp16, x = input_23_cast_fp16)[name = tensor<string, []>("hidden_states_9_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_13_cast_fp16 = add(x = inputs_11_cast_fp16, y = hidden_states_9_cast_fp16)[name = tensor<string, []>("inputs_13_cast_fp16")];
            tensor<int32, []> var_2147 = const()[name = tensor<string, []>("op_2147"), val = tensor<int32, []>(3)];
            tensor<int32, []> var_2160 = const()[name = tensor<string, []>("op_2160"), val = tensor<int32, []>(1)];
            tensor<bool, []> var_2161 = const()[name = tensor<string, []>("op_2161"), val = tensor<bool, []>(true)];
            tensor<int32, [1]> var_2171 = const()[name = tensor<string, []>("op_2171"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_13_cast_fp16 = reduce_mean(axes = var_2171, keep_dims = var_2161, x = inputs_13_cast_fp16)[name = tensor<string, []>("channels_mean_13_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_13_cast_fp16 = sub(x = inputs_13_cast_fp16, y = channels_mean_13_cast_fp16)[name = tensor<string, []>("zero_mean_13_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_13_cast_fp16 = mul(x = zero_mean_13_cast_fp16, y = zero_mean_13_cast_fp16)[name = tensor<string, []>("zero_mean_sq_13_cast_fp16")];
            tensor<int32, [1]> var_2175 = const()[name = tensor<string, []>("op_2175"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_2176_cast_fp16 = reduce_mean(axes = var_2175, keep_dims = var_2161, x = zero_mean_sq_13_cast_fp16)[name = tensor<string, []>("op_2176_cast_fp16")];
            tensor<fp16, []> var_2177_to_fp16 = const()[name = tensor<string, []>("op_2177_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_2178_cast_fp16 = add(x = var_2176_cast_fp16, y = var_2177_to_fp16)[name = tensor<string, []>("op_2178_cast_fp16")];
            tensor<fp16, []> denom_13_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_13_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_13_cast_fp16 = rsqrt(epsilon = denom_13_epsilon_0_to_fp16, x = var_2178_cast_fp16)[name = tensor<string, []>("denom_13_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_13_cast_fp16 = mul(x = zero_mean_13_cast_fp16, y = denom_13_cast_fp16)[name = tensor<string, []>("out_13_cast_fp16")];
            tensor<fp16, [512]> obj_13_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_13_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22273344)))];
            tensor<fp16, [512]> obj_13_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_13_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22274432)))];
            tensor<fp16, []> obj_13_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_13_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> obj_13_cast_fp16 = batch_norm(beta = obj_13_beta_0_to_fp16, epsilon = obj_13_epsilon_0_to_fp16, gamma = obj_13_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_13_cast_fp16)[name = tensor<string, []>("obj_13_cast_fp16")];
            tensor<int32, [2]> var_2193 = const()[name = tensor<string, []>("op_2193"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2195 = const()[name = tensor<string, []>("op_2195"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_7_pad_type_0 = const()[name = tensor<string, []>("query_7_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_7_pad_0 = const()[name = tensor<string, []>("query_7_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_3_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22275520)))];
            tensor<fp16, [512]> layers_3_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22799872)))];
            tensor<fp16, [1, 512, 1, 1500]> query_7_cast_fp16 = conv(bias = layers_3_self_attn_q_proj_bias_to_fp16, dilations = var_2195, groups = var_2160, pad = query_7_pad_0, pad_type = query_7_pad_type_0, strides = var_2193, weight = layers_3_self_attn_q_proj_weight_to_fp16, x = obj_13_cast_fp16)[name = tensor<string, []>("query_7_cast_fp16")];
            tensor<int32, [2]> var_2199 = const()[name = tensor<string, []>("op_2199"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2201 = const()[name = tensor<string, []>("op_2201"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_7_pad_type_0 = const()[name = tensor<string, []>("key_7_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_7_pad_0 = const()[name = tensor<string, []>("key_7_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_3_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(22800960)))];
            tensor<fp16, [1, 512, 1, 1500]> key_7_cast_fp16 = conv(dilations = var_2201, groups = var_2160, pad = key_7_pad_0, pad_type = key_7_pad_type_0, strides = var_2199, weight = layers_3_self_attn_k_proj_weight_to_fp16, x = obj_13_cast_fp16)[name = tensor<string, []>("key_7_cast_fp16")];
            tensor<int32, [2]> var_2206 = const()[name = tensor<string, []>("op_2206"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2208 = const()[name = tensor<string, []>("op_2208"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_7_pad_type_0 = const()[name = tensor<string, []>("value_7_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_7_pad_0 = const()[name = tensor<string, []>("value_7_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_3_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(23325312)))];
            tensor<fp16, [512]> layers_3_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(23849664)))];
            tensor<fp16, [1, 512, 1, 1500]> value_7_cast_fp16 = conv(bias = layers_3_self_attn_v_proj_bias_to_fp16, dilations = var_2208, groups = var_2160, pad = value_7_pad_0, pad_type = value_7_pad_type_0, strides = var_2206, weight = layers_3_self_attn_v_proj_weight_to_fp16, x = obj_13_cast_fp16)[name = tensor<string, []>("value_7_cast_fp16")];
            tensor<int32, [4]> var_2215_begin_0 = const()[name = tensor<string, []>("op_2215_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2215_end_0 = const()[name = tensor<string, []>("op_2215_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2215_end_mask_0 = const()[name = tensor<string, []>("op_2215_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2215_cast_fp16 = slice_by_index(begin = var_2215_begin_0, end = var_2215_end_0, end_mask = var_2215_end_mask_0, x = query_7_cast_fp16)[name = tensor<string, []>("op_2215_cast_fp16")];
            tensor<int32, [4]> var_2219_begin_0 = const()[name = tensor<string, []>("op_2219_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_2219_end_0 = const()[name = tensor<string, []>("op_2219_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_2219_end_mask_0 = const()[name = tensor<string, []>("op_2219_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2219_cast_fp16 = slice_by_index(begin = var_2219_begin_0, end = var_2219_end_0, end_mask = var_2219_end_mask_0, x = query_7_cast_fp16)[name = tensor<string, []>("op_2219_cast_fp16")];
            tensor<int32, [4]> var_2223_begin_0 = const()[name = tensor<string, []>("op_2223_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_2223_end_0 = const()[name = tensor<string, []>("op_2223_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_2223_end_mask_0 = const()[name = tensor<string, []>("op_2223_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2223_cast_fp16 = slice_by_index(begin = var_2223_begin_0, end = var_2223_end_0, end_mask = var_2223_end_mask_0, x = query_7_cast_fp16)[name = tensor<string, []>("op_2223_cast_fp16")];
            tensor<int32, [4]> var_2227_begin_0 = const()[name = tensor<string, []>("op_2227_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_2227_end_0 = const()[name = tensor<string, []>("op_2227_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_2227_end_mask_0 = const()[name = tensor<string, []>("op_2227_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2227_cast_fp16 = slice_by_index(begin = var_2227_begin_0, end = var_2227_end_0, end_mask = var_2227_end_mask_0, x = query_7_cast_fp16)[name = tensor<string, []>("op_2227_cast_fp16")];
            tensor<int32, [4]> var_2231_begin_0 = const()[name = tensor<string, []>("op_2231_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_2231_end_0 = const()[name = tensor<string, []>("op_2231_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_2231_end_mask_0 = const()[name = tensor<string, []>("op_2231_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2231_cast_fp16 = slice_by_index(begin = var_2231_begin_0, end = var_2231_end_0, end_mask = var_2231_end_mask_0, x = query_7_cast_fp16)[name = tensor<string, []>("op_2231_cast_fp16")];
            tensor<int32, [4]> var_2235_begin_0 = const()[name = tensor<string, []>("op_2235_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_2235_end_0 = const()[name = tensor<string, []>("op_2235_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_2235_end_mask_0 = const()[name = tensor<string, []>("op_2235_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2235_cast_fp16 = slice_by_index(begin = var_2235_begin_0, end = var_2235_end_0, end_mask = var_2235_end_mask_0, x = query_7_cast_fp16)[name = tensor<string, []>("op_2235_cast_fp16")];
            tensor<int32, [4]> var_2239_begin_0 = const()[name = tensor<string, []>("op_2239_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_2239_end_0 = const()[name = tensor<string, []>("op_2239_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_2239_end_mask_0 = const()[name = tensor<string, []>("op_2239_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2239_cast_fp16 = slice_by_index(begin = var_2239_begin_0, end = var_2239_end_0, end_mask = var_2239_end_mask_0, x = query_7_cast_fp16)[name = tensor<string, []>("op_2239_cast_fp16")];
            tensor<int32, [4]> var_2243_begin_0 = const()[name = tensor<string, []>("op_2243_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_2243_end_0 = const()[name = tensor<string, []>("op_2243_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_2243_end_mask_0 = const()[name = tensor<string, []>("op_2243_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2243_cast_fp16 = slice_by_index(begin = var_2243_begin_0, end = var_2243_end_0, end_mask = var_2243_end_mask_0, x = query_7_cast_fp16)[name = tensor<string, []>("op_2243_cast_fp16")];
            tensor<int32, [4]> var_2252_begin_0 = const()[name = tensor<string, []>("op_2252_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2252_end_0 = const()[name = tensor<string, []>("op_2252_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2252_end_mask_0 = const()[name = tensor<string, []>("op_2252_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2252_cast_fp16 = slice_by_index(begin = var_2252_begin_0, end = var_2252_end_0, end_mask = var_2252_end_mask_0, x = var_2215_cast_fp16)[name = tensor<string, []>("op_2252_cast_fp16")];
            tensor<int32, [4]> var_2259_begin_0 = const()[name = tensor<string, []>("op_2259_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2259_end_0 = const()[name = tensor<string, []>("op_2259_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2259_end_mask_0 = const()[name = tensor<string, []>("op_2259_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2259_cast_fp16 = slice_by_index(begin = var_2259_begin_0, end = var_2259_end_0, end_mask = var_2259_end_mask_0, x = var_2215_cast_fp16)[name = tensor<string, []>("op_2259_cast_fp16")];
            tensor<int32, [4]> var_2266_begin_0 = const()[name = tensor<string, []>("op_2266_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2266_end_0 = const()[name = tensor<string, []>("op_2266_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2266_end_mask_0 = const()[name = tensor<string, []>("op_2266_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2266_cast_fp16 = slice_by_index(begin = var_2266_begin_0, end = var_2266_end_0, end_mask = var_2266_end_mask_0, x = var_2215_cast_fp16)[name = tensor<string, []>("op_2266_cast_fp16")];
            tensor<int32, [4]> var_2273_begin_0 = const()[name = tensor<string, []>("op_2273_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2273_end_0 = const()[name = tensor<string, []>("op_2273_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2273_end_mask_0 = const()[name = tensor<string, []>("op_2273_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2273_cast_fp16 = slice_by_index(begin = var_2273_begin_0, end = var_2273_end_0, end_mask = var_2273_end_mask_0, x = var_2215_cast_fp16)[name = tensor<string, []>("op_2273_cast_fp16")];
            tensor<int32, [4]> var_2280_begin_0 = const()[name = tensor<string, []>("op_2280_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2280_end_0 = const()[name = tensor<string, []>("op_2280_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2280_end_mask_0 = const()[name = tensor<string, []>("op_2280_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2280_cast_fp16 = slice_by_index(begin = var_2280_begin_0, end = var_2280_end_0, end_mask = var_2280_end_mask_0, x = var_2219_cast_fp16)[name = tensor<string, []>("op_2280_cast_fp16")];
            tensor<int32, [4]> var_2287_begin_0 = const()[name = tensor<string, []>("op_2287_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2287_end_0 = const()[name = tensor<string, []>("op_2287_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2287_end_mask_0 = const()[name = tensor<string, []>("op_2287_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2287_cast_fp16 = slice_by_index(begin = var_2287_begin_0, end = var_2287_end_0, end_mask = var_2287_end_mask_0, x = var_2219_cast_fp16)[name = tensor<string, []>("op_2287_cast_fp16")];
            tensor<int32, [4]> var_2294_begin_0 = const()[name = tensor<string, []>("op_2294_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2294_end_0 = const()[name = tensor<string, []>("op_2294_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2294_end_mask_0 = const()[name = tensor<string, []>("op_2294_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2294_cast_fp16 = slice_by_index(begin = var_2294_begin_0, end = var_2294_end_0, end_mask = var_2294_end_mask_0, x = var_2219_cast_fp16)[name = tensor<string, []>("op_2294_cast_fp16")];
            tensor<int32, [4]> var_2301_begin_0 = const()[name = tensor<string, []>("op_2301_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2301_end_0 = const()[name = tensor<string, []>("op_2301_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2301_end_mask_0 = const()[name = tensor<string, []>("op_2301_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2301_cast_fp16 = slice_by_index(begin = var_2301_begin_0, end = var_2301_end_0, end_mask = var_2301_end_mask_0, x = var_2219_cast_fp16)[name = tensor<string, []>("op_2301_cast_fp16")];
            tensor<int32, [4]> var_2308_begin_0 = const()[name = tensor<string, []>("op_2308_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2308_end_0 = const()[name = tensor<string, []>("op_2308_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2308_end_mask_0 = const()[name = tensor<string, []>("op_2308_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2308_cast_fp16 = slice_by_index(begin = var_2308_begin_0, end = var_2308_end_0, end_mask = var_2308_end_mask_0, x = var_2223_cast_fp16)[name = tensor<string, []>("op_2308_cast_fp16")];
            tensor<int32, [4]> var_2315_begin_0 = const()[name = tensor<string, []>("op_2315_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2315_end_0 = const()[name = tensor<string, []>("op_2315_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2315_end_mask_0 = const()[name = tensor<string, []>("op_2315_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2315_cast_fp16 = slice_by_index(begin = var_2315_begin_0, end = var_2315_end_0, end_mask = var_2315_end_mask_0, x = var_2223_cast_fp16)[name = tensor<string, []>("op_2315_cast_fp16")];
            tensor<int32, [4]> var_2322_begin_0 = const()[name = tensor<string, []>("op_2322_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2322_end_0 = const()[name = tensor<string, []>("op_2322_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2322_end_mask_0 = const()[name = tensor<string, []>("op_2322_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2322_cast_fp16 = slice_by_index(begin = var_2322_begin_0, end = var_2322_end_0, end_mask = var_2322_end_mask_0, x = var_2223_cast_fp16)[name = tensor<string, []>("op_2322_cast_fp16")];
            tensor<int32, [4]> var_2329_begin_0 = const()[name = tensor<string, []>("op_2329_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2329_end_0 = const()[name = tensor<string, []>("op_2329_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2329_end_mask_0 = const()[name = tensor<string, []>("op_2329_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2329_cast_fp16 = slice_by_index(begin = var_2329_begin_0, end = var_2329_end_0, end_mask = var_2329_end_mask_0, x = var_2223_cast_fp16)[name = tensor<string, []>("op_2329_cast_fp16")];
            tensor<int32, [4]> var_2336_begin_0 = const()[name = tensor<string, []>("op_2336_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2336_end_0 = const()[name = tensor<string, []>("op_2336_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2336_end_mask_0 = const()[name = tensor<string, []>("op_2336_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2336_cast_fp16 = slice_by_index(begin = var_2336_begin_0, end = var_2336_end_0, end_mask = var_2336_end_mask_0, x = var_2227_cast_fp16)[name = tensor<string, []>("op_2336_cast_fp16")];
            tensor<int32, [4]> var_2343_begin_0 = const()[name = tensor<string, []>("op_2343_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2343_end_0 = const()[name = tensor<string, []>("op_2343_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2343_end_mask_0 = const()[name = tensor<string, []>("op_2343_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2343_cast_fp16 = slice_by_index(begin = var_2343_begin_0, end = var_2343_end_0, end_mask = var_2343_end_mask_0, x = var_2227_cast_fp16)[name = tensor<string, []>("op_2343_cast_fp16")];
            tensor<int32, [4]> var_2350_begin_0 = const()[name = tensor<string, []>("op_2350_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2350_end_0 = const()[name = tensor<string, []>("op_2350_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2350_end_mask_0 = const()[name = tensor<string, []>("op_2350_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2350_cast_fp16 = slice_by_index(begin = var_2350_begin_0, end = var_2350_end_0, end_mask = var_2350_end_mask_0, x = var_2227_cast_fp16)[name = tensor<string, []>("op_2350_cast_fp16")];
            tensor<int32, [4]> var_2357_begin_0 = const()[name = tensor<string, []>("op_2357_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2357_end_0 = const()[name = tensor<string, []>("op_2357_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2357_end_mask_0 = const()[name = tensor<string, []>("op_2357_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2357_cast_fp16 = slice_by_index(begin = var_2357_begin_0, end = var_2357_end_0, end_mask = var_2357_end_mask_0, x = var_2227_cast_fp16)[name = tensor<string, []>("op_2357_cast_fp16")];
            tensor<int32, [4]> var_2364_begin_0 = const()[name = tensor<string, []>("op_2364_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2364_end_0 = const()[name = tensor<string, []>("op_2364_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2364_end_mask_0 = const()[name = tensor<string, []>("op_2364_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2364_cast_fp16 = slice_by_index(begin = var_2364_begin_0, end = var_2364_end_0, end_mask = var_2364_end_mask_0, x = var_2231_cast_fp16)[name = tensor<string, []>("op_2364_cast_fp16")];
            tensor<int32, [4]> var_2371_begin_0 = const()[name = tensor<string, []>("op_2371_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2371_end_0 = const()[name = tensor<string, []>("op_2371_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2371_end_mask_0 = const()[name = tensor<string, []>("op_2371_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2371_cast_fp16 = slice_by_index(begin = var_2371_begin_0, end = var_2371_end_0, end_mask = var_2371_end_mask_0, x = var_2231_cast_fp16)[name = tensor<string, []>("op_2371_cast_fp16")];
            tensor<int32, [4]> var_2378_begin_0 = const()[name = tensor<string, []>("op_2378_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2378_end_0 = const()[name = tensor<string, []>("op_2378_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2378_end_mask_0 = const()[name = tensor<string, []>("op_2378_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2378_cast_fp16 = slice_by_index(begin = var_2378_begin_0, end = var_2378_end_0, end_mask = var_2378_end_mask_0, x = var_2231_cast_fp16)[name = tensor<string, []>("op_2378_cast_fp16")];
            tensor<int32, [4]> var_2385_begin_0 = const()[name = tensor<string, []>("op_2385_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2385_end_0 = const()[name = tensor<string, []>("op_2385_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2385_end_mask_0 = const()[name = tensor<string, []>("op_2385_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2385_cast_fp16 = slice_by_index(begin = var_2385_begin_0, end = var_2385_end_0, end_mask = var_2385_end_mask_0, x = var_2231_cast_fp16)[name = tensor<string, []>("op_2385_cast_fp16")];
            tensor<int32, [4]> var_2392_begin_0 = const()[name = tensor<string, []>("op_2392_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2392_end_0 = const()[name = tensor<string, []>("op_2392_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2392_end_mask_0 = const()[name = tensor<string, []>("op_2392_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2392_cast_fp16 = slice_by_index(begin = var_2392_begin_0, end = var_2392_end_0, end_mask = var_2392_end_mask_0, x = var_2235_cast_fp16)[name = tensor<string, []>("op_2392_cast_fp16")];
            tensor<int32, [4]> var_2399_begin_0 = const()[name = tensor<string, []>("op_2399_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2399_end_0 = const()[name = tensor<string, []>("op_2399_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2399_end_mask_0 = const()[name = tensor<string, []>("op_2399_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2399_cast_fp16 = slice_by_index(begin = var_2399_begin_0, end = var_2399_end_0, end_mask = var_2399_end_mask_0, x = var_2235_cast_fp16)[name = tensor<string, []>("op_2399_cast_fp16")];
            tensor<int32, [4]> var_2406_begin_0 = const()[name = tensor<string, []>("op_2406_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2406_end_0 = const()[name = tensor<string, []>("op_2406_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2406_end_mask_0 = const()[name = tensor<string, []>("op_2406_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2406_cast_fp16 = slice_by_index(begin = var_2406_begin_0, end = var_2406_end_0, end_mask = var_2406_end_mask_0, x = var_2235_cast_fp16)[name = tensor<string, []>("op_2406_cast_fp16")];
            tensor<int32, [4]> var_2413_begin_0 = const()[name = tensor<string, []>("op_2413_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2413_end_0 = const()[name = tensor<string, []>("op_2413_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2413_end_mask_0 = const()[name = tensor<string, []>("op_2413_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2413_cast_fp16 = slice_by_index(begin = var_2413_begin_0, end = var_2413_end_0, end_mask = var_2413_end_mask_0, x = var_2235_cast_fp16)[name = tensor<string, []>("op_2413_cast_fp16")];
            tensor<int32, [4]> var_2420_begin_0 = const()[name = tensor<string, []>("op_2420_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2420_end_0 = const()[name = tensor<string, []>("op_2420_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2420_end_mask_0 = const()[name = tensor<string, []>("op_2420_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2420_cast_fp16 = slice_by_index(begin = var_2420_begin_0, end = var_2420_end_0, end_mask = var_2420_end_mask_0, x = var_2239_cast_fp16)[name = tensor<string, []>("op_2420_cast_fp16")];
            tensor<int32, [4]> var_2427_begin_0 = const()[name = tensor<string, []>("op_2427_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2427_end_0 = const()[name = tensor<string, []>("op_2427_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2427_end_mask_0 = const()[name = tensor<string, []>("op_2427_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2427_cast_fp16 = slice_by_index(begin = var_2427_begin_0, end = var_2427_end_0, end_mask = var_2427_end_mask_0, x = var_2239_cast_fp16)[name = tensor<string, []>("op_2427_cast_fp16")];
            tensor<int32, [4]> var_2434_begin_0 = const()[name = tensor<string, []>("op_2434_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2434_end_0 = const()[name = tensor<string, []>("op_2434_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2434_end_mask_0 = const()[name = tensor<string, []>("op_2434_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2434_cast_fp16 = slice_by_index(begin = var_2434_begin_0, end = var_2434_end_0, end_mask = var_2434_end_mask_0, x = var_2239_cast_fp16)[name = tensor<string, []>("op_2434_cast_fp16")];
            tensor<int32, [4]> var_2441_begin_0 = const()[name = tensor<string, []>("op_2441_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2441_end_0 = const()[name = tensor<string, []>("op_2441_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2441_end_mask_0 = const()[name = tensor<string, []>("op_2441_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2441_cast_fp16 = slice_by_index(begin = var_2441_begin_0, end = var_2441_end_0, end_mask = var_2441_end_mask_0, x = var_2239_cast_fp16)[name = tensor<string, []>("op_2441_cast_fp16")];
            tensor<int32, [4]> var_2448_begin_0 = const()[name = tensor<string, []>("op_2448_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2448_end_0 = const()[name = tensor<string, []>("op_2448_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2448_end_mask_0 = const()[name = tensor<string, []>("op_2448_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2448_cast_fp16 = slice_by_index(begin = var_2448_begin_0, end = var_2448_end_0, end_mask = var_2448_end_mask_0, x = var_2243_cast_fp16)[name = tensor<string, []>("op_2448_cast_fp16")];
            tensor<int32, [4]> var_2455_begin_0 = const()[name = tensor<string, []>("op_2455_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2455_end_0 = const()[name = tensor<string, []>("op_2455_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2455_end_mask_0 = const()[name = tensor<string, []>("op_2455_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2455_cast_fp16 = slice_by_index(begin = var_2455_begin_0, end = var_2455_end_0, end_mask = var_2455_end_mask_0, x = var_2243_cast_fp16)[name = tensor<string, []>("op_2455_cast_fp16")];
            tensor<int32, [4]> var_2462_begin_0 = const()[name = tensor<string, []>("op_2462_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2462_end_0 = const()[name = tensor<string, []>("op_2462_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2462_end_mask_0 = const()[name = tensor<string, []>("op_2462_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2462_cast_fp16 = slice_by_index(begin = var_2462_begin_0, end = var_2462_end_0, end_mask = var_2462_end_mask_0, x = var_2243_cast_fp16)[name = tensor<string, []>("op_2462_cast_fp16")];
            tensor<int32, [4]> var_2469_begin_0 = const()[name = tensor<string, []>("op_2469_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2469_end_0 = const()[name = tensor<string, []>("op_2469_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2469_end_mask_0 = const()[name = tensor<string, []>("op_2469_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2469_cast_fp16 = slice_by_index(begin = var_2469_begin_0, end = var_2469_end_0, end_mask = var_2469_end_mask_0, x = var_2243_cast_fp16)[name = tensor<string, []>("op_2469_cast_fp16")];
            tensor<int32, [4]> k_7_perm_0 = const()[name = tensor<string, []>("k_7_perm_0"), val = tensor<int32, [4]>([0, 3, 2, 1])];
            tensor<int32, [4]> var_2474_begin_0 = const()[name = tensor<string, []>("op_2474_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2474_end_0 = const()[name = tensor<string, []>("op_2474_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 64])];
            tensor<bool, [4]> var_2474_end_mask_0 = const()[name = tensor<string, []>("op_2474_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 512]> transpose_2 = transpose(perm = k_7_perm_0, x = key_7_cast_fp16)[name = tensor<string, []>("transpose_2")];
            tensor<fp16, [1, 1500, 1, 64]> var_2474_cast_fp16 = slice_by_index(begin = var_2474_begin_0, end = var_2474_end_0, end_mask = var_2474_end_mask_0, x = transpose_2)[name = tensor<string, []>("op_2474_cast_fp16")];
            tensor<int32, [4]> var_2478_begin_0 = const()[name = tensor<string, []>("op_2478_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 64])];
            tensor<int32, [4]> var_2478_end_0 = const()[name = tensor<string, []>("op_2478_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 128])];
            tensor<bool, [4]> var_2478_end_mask_0 = const()[name = tensor<string, []>("op_2478_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_2478_cast_fp16 = slice_by_index(begin = var_2478_begin_0, end = var_2478_end_0, end_mask = var_2478_end_mask_0, x = transpose_2)[name = tensor<string, []>("op_2478_cast_fp16")];
            tensor<int32, [4]> var_2482_begin_0 = const()[name = tensor<string, []>("op_2482_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 128])];
            tensor<int32, [4]> var_2482_end_0 = const()[name = tensor<string, []>("op_2482_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 192])];
            tensor<bool, [4]> var_2482_end_mask_0 = const()[name = tensor<string, []>("op_2482_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_2482_cast_fp16 = slice_by_index(begin = var_2482_begin_0, end = var_2482_end_0, end_mask = var_2482_end_mask_0, x = transpose_2)[name = tensor<string, []>("op_2482_cast_fp16")];
            tensor<int32, [4]> var_2486_begin_0 = const()[name = tensor<string, []>("op_2486_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 192])];
            tensor<int32, [4]> var_2486_end_0 = const()[name = tensor<string, []>("op_2486_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 256])];
            tensor<bool, [4]> var_2486_end_mask_0 = const()[name = tensor<string, []>("op_2486_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_2486_cast_fp16 = slice_by_index(begin = var_2486_begin_0, end = var_2486_end_0, end_mask = var_2486_end_mask_0, x = transpose_2)[name = tensor<string, []>("op_2486_cast_fp16")];
            tensor<int32, [4]> var_2490_begin_0 = const()[name = tensor<string, []>("op_2490_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 256])];
            tensor<int32, [4]> var_2490_end_0 = const()[name = tensor<string, []>("op_2490_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 320])];
            tensor<bool, [4]> var_2490_end_mask_0 = const()[name = tensor<string, []>("op_2490_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_2490_cast_fp16 = slice_by_index(begin = var_2490_begin_0, end = var_2490_end_0, end_mask = var_2490_end_mask_0, x = transpose_2)[name = tensor<string, []>("op_2490_cast_fp16")];
            tensor<int32, [4]> var_2494_begin_0 = const()[name = tensor<string, []>("op_2494_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 320])];
            tensor<int32, [4]> var_2494_end_0 = const()[name = tensor<string, []>("op_2494_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 384])];
            tensor<bool, [4]> var_2494_end_mask_0 = const()[name = tensor<string, []>("op_2494_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_2494_cast_fp16 = slice_by_index(begin = var_2494_begin_0, end = var_2494_end_0, end_mask = var_2494_end_mask_0, x = transpose_2)[name = tensor<string, []>("op_2494_cast_fp16")];
            tensor<int32, [4]> var_2498_begin_0 = const()[name = tensor<string, []>("op_2498_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 384])];
            tensor<int32, [4]> var_2498_end_0 = const()[name = tensor<string, []>("op_2498_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 448])];
            tensor<bool, [4]> var_2498_end_mask_0 = const()[name = tensor<string, []>("op_2498_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_2498_cast_fp16 = slice_by_index(begin = var_2498_begin_0, end = var_2498_end_0, end_mask = var_2498_end_mask_0, x = transpose_2)[name = tensor<string, []>("op_2498_cast_fp16")];
            tensor<int32, [4]> var_2502_begin_0 = const()[name = tensor<string, []>("op_2502_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 448])];
            tensor<int32, [4]> var_2502_end_0 = const()[name = tensor<string, []>("op_2502_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 512])];
            tensor<bool, [4]> var_2502_end_mask_0 = const()[name = tensor<string, []>("op_2502_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_2502_cast_fp16 = slice_by_index(begin = var_2502_begin_0, end = var_2502_end_0, end_mask = var_2502_end_mask_0, x = transpose_2)[name = tensor<string, []>("op_2502_cast_fp16")];
            tensor<int32, [4]> var_2504_begin_0 = const()[name = tensor<string, []>("op_2504_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2504_end_0 = const()[name = tensor<string, []>("op_2504_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2504_end_mask_0 = const()[name = tensor<string, []>("op_2504_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2504_cast_fp16 = slice_by_index(begin = var_2504_begin_0, end = var_2504_end_0, end_mask = var_2504_end_mask_0, x = value_7_cast_fp16)[name = tensor<string, []>("op_2504_cast_fp16")];
            tensor<int32, [4]> var_2508_begin_0 = const()[name = tensor<string, []>("op_2508_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_2508_end_0 = const()[name = tensor<string, []>("op_2508_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_2508_end_mask_0 = const()[name = tensor<string, []>("op_2508_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2508_cast_fp16 = slice_by_index(begin = var_2508_begin_0, end = var_2508_end_0, end_mask = var_2508_end_mask_0, x = value_7_cast_fp16)[name = tensor<string, []>("op_2508_cast_fp16")];
            tensor<int32, [4]> var_2512_begin_0 = const()[name = tensor<string, []>("op_2512_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_2512_end_0 = const()[name = tensor<string, []>("op_2512_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_2512_end_mask_0 = const()[name = tensor<string, []>("op_2512_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2512_cast_fp16 = slice_by_index(begin = var_2512_begin_0, end = var_2512_end_0, end_mask = var_2512_end_mask_0, x = value_7_cast_fp16)[name = tensor<string, []>("op_2512_cast_fp16")];
            tensor<int32, [4]> var_2516_begin_0 = const()[name = tensor<string, []>("op_2516_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_2516_end_0 = const()[name = tensor<string, []>("op_2516_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_2516_end_mask_0 = const()[name = tensor<string, []>("op_2516_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2516_cast_fp16 = slice_by_index(begin = var_2516_begin_0, end = var_2516_end_0, end_mask = var_2516_end_mask_0, x = value_7_cast_fp16)[name = tensor<string, []>("op_2516_cast_fp16")];
            tensor<int32, [4]> var_2520_begin_0 = const()[name = tensor<string, []>("op_2520_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_2520_end_0 = const()[name = tensor<string, []>("op_2520_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_2520_end_mask_0 = const()[name = tensor<string, []>("op_2520_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2520_cast_fp16 = slice_by_index(begin = var_2520_begin_0, end = var_2520_end_0, end_mask = var_2520_end_mask_0, x = value_7_cast_fp16)[name = tensor<string, []>("op_2520_cast_fp16")];
            tensor<int32, [4]> var_2524_begin_0 = const()[name = tensor<string, []>("op_2524_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_2524_end_0 = const()[name = tensor<string, []>("op_2524_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_2524_end_mask_0 = const()[name = tensor<string, []>("op_2524_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2524_cast_fp16 = slice_by_index(begin = var_2524_begin_0, end = var_2524_end_0, end_mask = var_2524_end_mask_0, x = value_7_cast_fp16)[name = tensor<string, []>("op_2524_cast_fp16")];
            tensor<int32, [4]> var_2528_begin_0 = const()[name = tensor<string, []>("op_2528_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_2528_end_0 = const()[name = tensor<string, []>("op_2528_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_2528_end_mask_0 = const()[name = tensor<string, []>("op_2528_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2528_cast_fp16 = slice_by_index(begin = var_2528_begin_0, end = var_2528_end_0, end_mask = var_2528_end_mask_0, x = value_7_cast_fp16)[name = tensor<string, []>("op_2528_cast_fp16")];
            tensor<int32, [4]> var_2532_begin_0 = const()[name = tensor<string, []>("op_2532_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_2532_end_0 = const()[name = tensor<string, []>("op_2532_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_2532_end_mask_0 = const()[name = tensor<string, []>("op_2532_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2532_cast_fp16 = slice_by_index(begin = var_2532_begin_0, end = var_2532_end_0, end_mask = var_2532_end_mask_0, x = value_7_cast_fp16)[name = tensor<string, []>("op_2532_cast_fp16")];
            tensor<string, []> var_2536_equation_0 = const()[name = tensor<string, []>("op_2536_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2536_cast_fp16 = einsum(equation = var_2536_equation_0, values = (var_2474_cast_fp16, var_2252_cast_fp16))[name = tensor<string, []>("op_2536_cast_fp16")];
            tensor<fp16, []> var_2537_to_fp16 = const()[name = tensor<string, []>("op_2537_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_193_cast_fp16 = mul(x = var_2536_cast_fp16, y = var_2537_to_fp16)[name = tensor<string, []>("aw_chunk_193_cast_fp16")];
            tensor<string, []> var_2540_equation_0 = const()[name = tensor<string, []>("op_2540_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2540_cast_fp16 = einsum(equation = var_2540_equation_0, values = (var_2474_cast_fp16, var_2259_cast_fp16))[name = tensor<string, []>("op_2540_cast_fp16")];
            tensor<fp16, []> var_2541_to_fp16 = const()[name = tensor<string, []>("op_2541_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_195_cast_fp16 = mul(x = var_2540_cast_fp16, y = var_2541_to_fp16)[name = tensor<string, []>("aw_chunk_195_cast_fp16")];
            tensor<string, []> var_2544_equation_0 = const()[name = tensor<string, []>("op_2544_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2544_cast_fp16 = einsum(equation = var_2544_equation_0, values = (var_2474_cast_fp16, var_2266_cast_fp16))[name = tensor<string, []>("op_2544_cast_fp16")];
            tensor<fp16, []> var_2545_to_fp16 = const()[name = tensor<string, []>("op_2545_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_197_cast_fp16 = mul(x = var_2544_cast_fp16, y = var_2545_to_fp16)[name = tensor<string, []>("aw_chunk_197_cast_fp16")];
            tensor<string, []> var_2548_equation_0 = const()[name = tensor<string, []>("op_2548_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2548_cast_fp16 = einsum(equation = var_2548_equation_0, values = (var_2474_cast_fp16, var_2273_cast_fp16))[name = tensor<string, []>("op_2548_cast_fp16")];
            tensor<fp16, []> var_2549_to_fp16 = const()[name = tensor<string, []>("op_2549_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_199_cast_fp16 = mul(x = var_2548_cast_fp16, y = var_2549_to_fp16)[name = tensor<string, []>("aw_chunk_199_cast_fp16")];
            tensor<string, []> var_2552_equation_0 = const()[name = tensor<string, []>("op_2552_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2552_cast_fp16 = einsum(equation = var_2552_equation_0, values = (var_2478_cast_fp16, var_2280_cast_fp16))[name = tensor<string, []>("op_2552_cast_fp16")];
            tensor<fp16, []> var_2553_to_fp16 = const()[name = tensor<string, []>("op_2553_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_201_cast_fp16 = mul(x = var_2552_cast_fp16, y = var_2553_to_fp16)[name = tensor<string, []>("aw_chunk_201_cast_fp16")];
            tensor<string, []> var_2556_equation_0 = const()[name = tensor<string, []>("op_2556_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2556_cast_fp16 = einsum(equation = var_2556_equation_0, values = (var_2478_cast_fp16, var_2287_cast_fp16))[name = tensor<string, []>("op_2556_cast_fp16")];
            tensor<fp16, []> var_2557_to_fp16 = const()[name = tensor<string, []>("op_2557_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_203_cast_fp16 = mul(x = var_2556_cast_fp16, y = var_2557_to_fp16)[name = tensor<string, []>("aw_chunk_203_cast_fp16")];
            tensor<string, []> var_2560_equation_0 = const()[name = tensor<string, []>("op_2560_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2560_cast_fp16 = einsum(equation = var_2560_equation_0, values = (var_2478_cast_fp16, var_2294_cast_fp16))[name = tensor<string, []>("op_2560_cast_fp16")];
            tensor<fp16, []> var_2561_to_fp16 = const()[name = tensor<string, []>("op_2561_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_205_cast_fp16 = mul(x = var_2560_cast_fp16, y = var_2561_to_fp16)[name = tensor<string, []>("aw_chunk_205_cast_fp16")];
            tensor<string, []> var_2564_equation_0 = const()[name = tensor<string, []>("op_2564_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2564_cast_fp16 = einsum(equation = var_2564_equation_0, values = (var_2478_cast_fp16, var_2301_cast_fp16))[name = tensor<string, []>("op_2564_cast_fp16")];
            tensor<fp16, []> var_2565_to_fp16 = const()[name = tensor<string, []>("op_2565_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_207_cast_fp16 = mul(x = var_2564_cast_fp16, y = var_2565_to_fp16)[name = tensor<string, []>("aw_chunk_207_cast_fp16")];
            tensor<string, []> var_2568_equation_0 = const()[name = tensor<string, []>("op_2568_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2568_cast_fp16 = einsum(equation = var_2568_equation_0, values = (var_2482_cast_fp16, var_2308_cast_fp16))[name = tensor<string, []>("op_2568_cast_fp16")];
            tensor<fp16, []> var_2569_to_fp16 = const()[name = tensor<string, []>("op_2569_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_209_cast_fp16 = mul(x = var_2568_cast_fp16, y = var_2569_to_fp16)[name = tensor<string, []>("aw_chunk_209_cast_fp16")];
            tensor<string, []> var_2572_equation_0 = const()[name = tensor<string, []>("op_2572_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2572_cast_fp16 = einsum(equation = var_2572_equation_0, values = (var_2482_cast_fp16, var_2315_cast_fp16))[name = tensor<string, []>("op_2572_cast_fp16")];
            tensor<fp16, []> var_2573_to_fp16 = const()[name = tensor<string, []>("op_2573_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_211_cast_fp16 = mul(x = var_2572_cast_fp16, y = var_2573_to_fp16)[name = tensor<string, []>("aw_chunk_211_cast_fp16")];
            tensor<string, []> var_2576_equation_0 = const()[name = tensor<string, []>("op_2576_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2576_cast_fp16 = einsum(equation = var_2576_equation_0, values = (var_2482_cast_fp16, var_2322_cast_fp16))[name = tensor<string, []>("op_2576_cast_fp16")];
            tensor<fp16, []> var_2577_to_fp16 = const()[name = tensor<string, []>("op_2577_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_213_cast_fp16 = mul(x = var_2576_cast_fp16, y = var_2577_to_fp16)[name = tensor<string, []>("aw_chunk_213_cast_fp16")];
            tensor<string, []> var_2580_equation_0 = const()[name = tensor<string, []>("op_2580_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2580_cast_fp16 = einsum(equation = var_2580_equation_0, values = (var_2482_cast_fp16, var_2329_cast_fp16))[name = tensor<string, []>("op_2580_cast_fp16")];
            tensor<fp16, []> var_2581_to_fp16 = const()[name = tensor<string, []>("op_2581_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_215_cast_fp16 = mul(x = var_2580_cast_fp16, y = var_2581_to_fp16)[name = tensor<string, []>("aw_chunk_215_cast_fp16")];
            tensor<string, []> var_2584_equation_0 = const()[name = tensor<string, []>("op_2584_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2584_cast_fp16 = einsum(equation = var_2584_equation_0, values = (var_2486_cast_fp16, var_2336_cast_fp16))[name = tensor<string, []>("op_2584_cast_fp16")];
            tensor<fp16, []> var_2585_to_fp16 = const()[name = tensor<string, []>("op_2585_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_217_cast_fp16 = mul(x = var_2584_cast_fp16, y = var_2585_to_fp16)[name = tensor<string, []>("aw_chunk_217_cast_fp16")];
            tensor<string, []> var_2588_equation_0 = const()[name = tensor<string, []>("op_2588_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2588_cast_fp16 = einsum(equation = var_2588_equation_0, values = (var_2486_cast_fp16, var_2343_cast_fp16))[name = tensor<string, []>("op_2588_cast_fp16")];
            tensor<fp16, []> var_2589_to_fp16 = const()[name = tensor<string, []>("op_2589_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_219_cast_fp16 = mul(x = var_2588_cast_fp16, y = var_2589_to_fp16)[name = tensor<string, []>("aw_chunk_219_cast_fp16")];
            tensor<string, []> var_2592_equation_0 = const()[name = tensor<string, []>("op_2592_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2592_cast_fp16 = einsum(equation = var_2592_equation_0, values = (var_2486_cast_fp16, var_2350_cast_fp16))[name = tensor<string, []>("op_2592_cast_fp16")];
            tensor<fp16, []> var_2593_to_fp16 = const()[name = tensor<string, []>("op_2593_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_221_cast_fp16 = mul(x = var_2592_cast_fp16, y = var_2593_to_fp16)[name = tensor<string, []>("aw_chunk_221_cast_fp16")];
            tensor<string, []> var_2596_equation_0 = const()[name = tensor<string, []>("op_2596_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2596_cast_fp16 = einsum(equation = var_2596_equation_0, values = (var_2486_cast_fp16, var_2357_cast_fp16))[name = tensor<string, []>("op_2596_cast_fp16")];
            tensor<fp16, []> var_2597_to_fp16 = const()[name = tensor<string, []>("op_2597_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_223_cast_fp16 = mul(x = var_2596_cast_fp16, y = var_2597_to_fp16)[name = tensor<string, []>("aw_chunk_223_cast_fp16")];
            tensor<string, []> var_2600_equation_0 = const()[name = tensor<string, []>("op_2600_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2600_cast_fp16 = einsum(equation = var_2600_equation_0, values = (var_2490_cast_fp16, var_2364_cast_fp16))[name = tensor<string, []>("op_2600_cast_fp16")];
            tensor<fp16, []> var_2601_to_fp16 = const()[name = tensor<string, []>("op_2601_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_225_cast_fp16 = mul(x = var_2600_cast_fp16, y = var_2601_to_fp16)[name = tensor<string, []>("aw_chunk_225_cast_fp16")];
            tensor<string, []> var_2604_equation_0 = const()[name = tensor<string, []>("op_2604_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2604_cast_fp16 = einsum(equation = var_2604_equation_0, values = (var_2490_cast_fp16, var_2371_cast_fp16))[name = tensor<string, []>("op_2604_cast_fp16")];
            tensor<fp16, []> var_2605_to_fp16 = const()[name = tensor<string, []>("op_2605_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_227_cast_fp16 = mul(x = var_2604_cast_fp16, y = var_2605_to_fp16)[name = tensor<string, []>("aw_chunk_227_cast_fp16")];
            tensor<string, []> var_2608_equation_0 = const()[name = tensor<string, []>("op_2608_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2608_cast_fp16 = einsum(equation = var_2608_equation_0, values = (var_2490_cast_fp16, var_2378_cast_fp16))[name = tensor<string, []>("op_2608_cast_fp16")];
            tensor<fp16, []> var_2609_to_fp16 = const()[name = tensor<string, []>("op_2609_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_229_cast_fp16 = mul(x = var_2608_cast_fp16, y = var_2609_to_fp16)[name = tensor<string, []>("aw_chunk_229_cast_fp16")];
            tensor<string, []> var_2612_equation_0 = const()[name = tensor<string, []>("op_2612_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2612_cast_fp16 = einsum(equation = var_2612_equation_0, values = (var_2490_cast_fp16, var_2385_cast_fp16))[name = tensor<string, []>("op_2612_cast_fp16")];
            tensor<fp16, []> var_2613_to_fp16 = const()[name = tensor<string, []>("op_2613_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_231_cast_fp16 = mul(x = var_2612_cast_fp16, y = var_2613_to_fp16)[name = tensor<string, []>("aw_chunk_231_cast_fp16")];
            tensor<string, []> var_2616_equation_0 = const()[name = tensor<string, []>("op_2616_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2616_cast_fp16 = einsum(equation = var_2616_equation_0, values = (var_2494_cast_fp16, var_2392_cast_fp16))[name = tensor<string, []>("op_2616_cast_fp16")];
            tensor<fp16, []> var_2617_to_fp16 = const()[name = tensor<string, []>("op_2617_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_233_cast_fp16 = mul(x = var_2616_cast_fp16, y = var_2617_to_fp16)[name = tensor<string, []>("aw_chunk_233_cast_fp16")];
            tensor<string, []> var_2620_equation_0 = const()[name = tensor<string, []>("op_2620_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2620_cast_fp16 = einsum(equation = var_2620_equation_0, values = (var_2494_cast_fp16, var_2399_cast_fp16))[name = tensor<string, []>("op_2620_cast_fp16")];
            tensor<fp16, []> var_2621_to_fp16 = const()[name = tensor<string, []>("op_2621_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_235_cast_fp16 = mul(x = var_2620_cast_fp16, y = var_2621_to_fp16)[name = tensor<string, []>("aw_chunk_235_cast_fp16")];
            tensor<string, []> var_2624_equation_0 = const()[name = tensor<string, []>("op_2624_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2624_cast_fp16 = einsum(equation = var_2624_equation_0, values = (var_2494_cast_fp16, var_2406_cast_fp16))[name = tensor<string, []>("op_2624_cast_fp16")];
            tensor<fp16, []> var_2625_to_fp16 = const()[name = tensor<string, []>("op_2625_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_237_cast_fp16 = mul(x = var_2624_cast_fp16, y = var_2625_to_fp16)[name = tensor<string, []>("aw_chunk_237_cast_fp16")];
            tensor<string, []> var_2628_equation_0 = const()[name = tensor<string, []>("op_2628_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2628_cast_fp16 = einsum(equation = var_2628_equation_0, values = (var_2494_cast_fp16, var_2413_cast_fp16))[name = tensor<string, []>("op_2628_cast_fp16")];
            tensor<fp16, []> var_2629_to_fp16 = const()[name = tensor<string, []>("op_2629_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_239_cast_fp16 = mul(x = var_2628_cast_fp16, y = var_2629_to_fp16)[name = tensor<string, []>("aw_chunk_239_cast_fp16")];
            tensor<string, []> var_2632_equation_0 = const()[name = tensor<string, []>("op_2632_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2632_cast_fp16 = einsum(equation = var_2632_equation_0, values = (var_2498_cast_fp16, var_2420_cast_fp16))[name = tensor<string, []>("op_2632_cast_fp16")];
            tensor<fp16, []> var_2633_to_fp16 = const()[name = tensor<string, []>("op_2633_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_241_cast_fp16 = mul(x = var_2632_cast_fp16, y = var_2633_to_fp16)[name = tensor<string, []>("aw_chunk_241_cast_fp16")];
            tensor<string, []> var_2636_equation_0 = const()[name = tensor<string, []>("op_2636_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2636_cast_fp16 = einsum(equation = var_2636_equation_0, values = (var_2498_cast_fp16, var_2427_cast_fp16))[name = tensor<string, []>("op_2636_cast_fp16")];
            tensor<fp16, []> var_2637_to_fp16 = const()[name = tensor<string, []>("op_2637_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_243_cast_fp16 = mul(x = var_2636_cast_fp16, y = var_2637_to_fp16)[name = tensor<string, []>("aw_chunk_243_cast_fp16")];
            tensor<string, []> var_2640_equation_0 = const()[name = tensor<string, []>("op_2640_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2640_cast_fp16 = einsum(equation = var_2640_equation_0, values = (var_2498_cast_fp16, var_2434_cast_fp16))[name = tensor<string, []>("op_2640_cast_fp16")];
            tensor<fp16, []> var_2641_to_fp16 = const()[name = tensor<string, []>("op_2641_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_245_cast_fp16 = mul(x = var_2640_cast_fp16, y = var_2641_to_fp16)[name = tensor<string, []>("aw_chunk_245_cast_fp16")];
            tensor<string, []> var_2644_equation_0 = const()[name = tensor<string, []>("op_2644_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2644_cast_fp16 = einsum(equation = var_2644_equation_0, values = (var_2498_cast_fp16, var_2441_cast_fp16))[name = tensor<string, []>("op_2644_cast_fp16")];
            tensor<fp16, []> var_2645_to_fp16 = const()[name = tensor<string, []>("op_2645_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_247_cast_fp16 = mul(x = var_2644_cast_fp16, y = var_2645_to_fp16)[name = tensor<string, []>("aw_chunk_247_cast_fp16")];
            tensor<string, []> var_2648_equation_0 = const()[name = tensor<string, []>("op_2648_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2648_cast_fp16 = einsum(equation = var_2648_equation_0, values = (var_2502_cast_fp16, var_2448_cast_fp16))[name = tensor<string, []>("op_2648_cast_fp16")];
            tensor<fp16, []> var_2649_to_fp16 = const()[name = tensor<string, []>("op_2649_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_249_cast_fp16 = mul(x = var_2648_cast_fp16, y = var_2649_to_fp16)[name = tensor<string, []>("aw_chunk_249_cast_fp16")];
            tensor<string, []> var_2652_equation_0 = const()[name = tensor<string, []>("op_2652_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2652_cast_fp16 = einsum(equation = var_2652_equation_0, values = (var_2502_cast_fp16, var_2455_cast_fp16))[name = tensor<string, []>("op_2652_cast_fp16")];
            tensor<fp16, []> var_2653_to_fp16 = const()[name = tensor<string, []>("op_2653_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_251_cast_fp16 = mul(x = var_2652_cast_fp16, y = var_2653_to_fp16)[name = tensor<string, []>("aw_chunk_251_cast_fp16")];
            tensor<string, []> var_2656_equation_0 = const()[name = tensor<string, []>("op_2656_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2656_cast_fp16 = einsum(equation = var_2656_equation_0, values = (var_2502_cast_fp16, var_2462_cast_fp16))[name = tensor<string, []>("op_2656_cast_fp16")];
            tensor<fp16, []> var_2657_to_fp16 = const()[name = tensor<string, []>("op_2657_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_253_cast_fp16 = mul(x = var_2656_cast_fp16, y = var_2657_to_fp16)[name = tensor<string, []>("aw_chunk_253_cast_fp16")];
            tensor<string, []> var_2660_equation_0 = const()[name = tensor<string, []>("op_2660_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_2660_cast_fp16 = einsum(equation = var_2660_equation_0, values = (var_2502_cast_fp16, var_2469_cast_fp16))[name = tensor<string, []>("op_2660_cast_fp16")];
            tensor<fp16, []> var_2661_to_fp16 = const()[name = tensor<string, []>("op_2661_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_255_cast_fp16 = mul(x = var_2660_cast_fp16, y = var_2661_to_fp16)[name = tensor<string, []>("aw_chunk_255_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2663_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_193_cast_fp16)[name = tensor<string, []>("op_2663_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2664_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_195_cast_fp16)[name = tensor<string, []>("op_2664_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2665_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_197_cast_fp16)[name = tensor<string, []>("op_2665_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2666_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_199_cast_fp16)[name = tensor<string, []>("op_2666_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2667_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_201_cast_fp16)[name = tensor<string, []>("op_2667_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2668_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_203_cast_fp16)[name = tensor<string, []>("op_2668_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2669_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_205_cast_fp16)[name = tensor<string, []>("op_2669_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2670_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_207_cast_fp16)[name = tensor<string, []>("op_2670_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2671_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_209_cast_fp16)[name = tensor<string, []>("op_2671_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2672_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_211_cast_fp16)[name = tensor<string, []>("op_2672_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2673_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_213_cast_fp16)[name = tensor<string, []>("op_2673_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2674_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_215_cast_fp16)[name = tensor<string, []>("op_2674_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2675_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_217_cast_fp16)[name = tensor<string, []>("op_2675_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2676_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_219_cast_fp16)[name = tensor<string, []>("op_2676_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2677_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_221_cast_fp16)[name = tensor<string, []>("op_2677_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2678_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_223_cast_fp16)[name = tensor<string, []>("op_2678_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2679_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_225_cast_fp16)[name = tensor<string, []>("op_2679_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2680_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_227_cast_fp16)[name = tensor<string, []>("op_2680_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2681_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_229_cast_fp16)[name = tensor<string, []>("op_2681_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2682_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_231_cast_fp16)[name = tensor<string, []>("op_2682_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2683_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_233_cast_fp16)[name = tensor<string, []>("op_2683_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2684_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_235_cast_fp16)[name = tensor<string, []>("op_2684_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2685_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_237_cast_fp16)[name = tensor<string, []>("op_2685_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2686_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_239_cast_fp16)[name = tensor<string, []>("op_2686_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2687_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_241_cast_fp16)[name = tensor<string, []>("op_2687_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2688_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_243_cast_fp16)[name = tensor<string, []>("op_2688_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2689_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_245_cast_fp16)[name = tensor<string, []>("op_2689_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2690_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_247_cast_fp16)[name = tensor<string, []>("op_2690_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2691_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_249_cast_fp16)[name = tensor<string, []>("op_2691_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2692_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_251_cast_fp16)[name = tensor<string, []>("op_2692_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2693_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_253_cast_fp16)[name = tensor<string, []>("op_2693_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_2694_cast_fp16 = softmax(axis = var_2160, x = aw_chunk_255_cast_fp16)[name = tensor<string, []>("op_2694_cast_fp16")];
            tensor<string, []> var_2696_equation_0 = const()[name = tensor<string, []>("op_2696_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2696_cast_fp16 = einsum(equation = var_2696_equation_0, values = (var_2504_cast_fp16, var_2663_cast_fp16))[name = tensor<string, []>("op_2696_cast_fp16")];
            tensor<string, []> var_2698_equation_0 = const()[name = tensor<string, []>("op_2698_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2698_cast_fp16 = einsum(equation = var_2698_equation_0, values = (var_2504_cast_fp16, var_2664_cast_fp16))[name = tensor<string, []>("op_2698_cast_fp16")];
            tensor<string, []> var_2700_equation_0 = const()[name = tensor<string, []>("op_2700_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2700_cast_fp16 = einsum(equation = var_2700_equation_0, values = (var_2504_cast_fp16, var_2665_cast_fp16))[name = tensor<string, []>("op_2700_cast_fp16")];
            tensor<string, []> var_2702_equation_0 = const()[name = tensor<string, []>("op_2702_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2702_cast_fp16 = einsum(equation = var_2702_equation_0, values = (var_2504_cast_fp16, var_2666_cast_fp16))[name = tensor<string, []>("op_2702_cast_fp16")];
            tensor<string, []> var_2704_equation_0 = const()[name = tensor<string, []>("op_2704_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2704_cast_fp16 = einsum(equation = var_2704_equation_0, values = (var_2508_cast_fp16, var_2667_cast_fp16))[name = tensor<string, []>("op_2704_cast_fp16")];
            tensor<string, []> var_2706_equation_0 = const()[name = tensor<string, []>("op_2706_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2706_cast_fp16 = einsum(equation = var_2706_equation_0, values = (var_2508_cast_fp16, var_2668_cast_fp16))[name = tensor<string, []>("op_2706_cast_fp16")];
            tensor<string, []> var_2708_equation_0 = const()[name = tensor<string, []>("op_2708_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2708_cast_fp16 = einsum(equation = var_2708_equation_0, values = (var_2508_cast_fp16, var_2669_cast_fp16))[name = tensor<string, []>("op_2708_cast_fp16")];
            tensor<string, []> var_2710_equation_0 = const()[name = tensor<string, []>("op_2710_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2710_cast_fp16 = einsum(equation = var_2710_equation_0, values = (var_2508_cast_fp16, var_2670_cast_fp16))[name = tensor<string, []>("op_2710_cast_fp16")];
            tensor<string, []> var_2712_equation_0 = const()[name = tensor<string, []>("op_2712_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2712_cast_fp16 = einsum(equation = var_2712_equation_0, values = (var_2512_cast_fp16, var_2671_cast_fp16))[name = tensor<string, []>("op_2712_cast_fp16")];
            tensor<string, []> var_2714_equation_0 = const()[name = tensor<string, []>("op_2714_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2714_cast_fp16 = einsum(equation = var_2714_equation_0, values = (var_2512_cast_fp16, var_2672_cast_fp16))[name = tensor<string, []>("op_2714_cast_fp16")];
            tensor<string, []> var_2716_equation_0 = const()[name = tensor<string, []>("op_2716_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2716_cast_fp16 = einsum(equation = var_2716_equation_0, values = (var_2512_cast_fp16, var_2673_cast_fp16))[name = tensor<string, []>("op_2716_cast_fp16")];
            tensor<string, []> var_2718_equation_0 = const()[name = tensor<string, []>("op_2718_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2718_cast_fp16 = einsum(equation = var_2718_equation_0, values = (var_2512_cast_fp16, var_2674_cast_fp16))[name = tensor<string, []>("op_2718_cast_fp16")];
            tensor<string, []> var_2720_equation_0 = const()[name = tensor<string, []>("op_2720_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2720_cast_fp16 = einsum(equation = var_2720_equation_0, values = (var_2516_cast_fp16, var_2675_cast_fp16))[name = tensor<string, []>("op_2720_cast_fp16")];
            tensor<string, []> var_2722_equation_0 = const()[name = tensor<string, []>("op_2722_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2722_cast_fp16 = einsum(equation = var_2722_equation_0, values = (var_2516_cast_fp16, var_2676_cast_fp16))[name = tensor<string, []>("op_2722_cast_fp16")];
            tensor<string, []> var_2724_equation_0 = const()[name = tensor<string, []>("op_2724_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2724_cast_fp16 = einsum(equation = var_2724_equation_0, values = (var_2516_cast_fp16, var_2677_cast_fp16))[name = tensor<string, []>("op_2724_cast_fp16")];
            tensor<string, []> var_2726_equation_0 = const()[name = tensor<string, []>("op_2726_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2726_cast_fp16 = einsum(equation = var_2726_equation_0, values = (var_2516_cast_fp16, var_2678_cast_fp16))[name = tensor<string, []>("op_2726_cast_fp16")];
            tensor<string, []> var_2728_equation_0 = const()[name = tensor<string, []>("op_2728_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2728_cast_fp16 = einsum(equation = var_2728_equation_0, values = (var_2520_cast_fp16, var_2679_cast_fp16))[name = tensor<string, []>("op_2728_cast_fp16")];
            tensor<string, []> var_2730_equation_0 = const()[name = tensor<string, []>("op_2730_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2730_cast_fp16 = einsum(equation = var_2730_equation_0, values = (var_2520_cast_fp16, var_2680_cast_fp16))[name = tensor<string, []>("op_2730_cast_fp16")];
            tensor<string, []> var_2732_equation_0 = const()[name = tensor<string, []>("op_2732_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2732_cast_fp16 = einsum(equation = var_2732_equation_0, values = (var_2520_cast_fp16, var_2681_cast_fp16))[name = tensor<string, []>("op_2732_cast_fp16")];
            tensor<string, []> var_2734_equation_0 = const()[name = tensor<string, []>("op_2734_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2734_cast_fp16 = einsum(equation = var_2734_equation_0, values = (var_2520_cast_fp16, var_2682_cast_fp16))[name = tensor<string, []>("op_2734_cast_fp16")];
            tensor<string, []> var_2736_equation_0 = const()[name = tensor<string, []>("op_2736_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2736_cast_fp16 = einsum(equation = var_2736_equation_0, values = (var_2524_cast_fp16, var_2683_cast_fp16))[name = tensor<string, []>("op_2736_cast_fp16")];
            tensor<string, []> var_2738_equation_0 = const()[name = tensor<string, []>("op_2738_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2738_cast_fp16 = einsum(equation = var_2738_equation_0, values = (var_2524_cast_fp16, var_2684_cast_fp16))[name = tensor<string, []>("op_2738_cast_fp16")];
            tensor<string, []> var_2740_equation_0 = const()[name = tensor<string, []>("op_2740_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2740_cast_fp16 = einsum(equation = var_2740_equation_0, values = (var_2524_cast_fp16, var_2685_cast_fp16))[name = tensor<string, []>("op_2740_cast_fp16")];
            tensor<string, []> var_2742_equation_0 = const()[name = tensor<string, []>("op_2742_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2742_cast_fp16 = einsum(equation = var_2742_equation_0, values = (var_2524_cast_fp16, var_2686_cast_fp16))[name = tensor<string, []>("op_2742_cast_fp16")];
            tensor<string, []> var_2744_equation_0 = const()[name = tensor<string, []>("op_2744_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2744_cast_fp16 = einsum(equation = var_2744_equation_0, values = (var_2528_cast_fp16, var_2687_cast_fp16))[name = tensor<string, []>("op_2744_cast_fp16")];
            tensor<string, []> var_2746_equation_0 = const()[name = tensor<string, []>("op_2746_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2746_cast_fp16 = einsum(equation = var_2746_equation_0, values = (var_2528_cast_fp16, var_2688_cast_fp16))[name = tensor<string, []>("op_2746_cast_fp16")];
            tensor<string, []> var_2748_equation_0 = const()[name = tensor<string, []>("op_2748_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2748_cast_fp16 = einsum(equation = var_2748_equation_0, values = (var_2528_cast_fp16, var_2689_cast_fp16))[name = tensor<string, []>("op_2748_cast_fp16")];
            tensor<string, []> var_2750_equation_0 = const()[name = tensor<string, []>("op_2750_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2750_cast_fp16 = einsum(equation = var_2750_equation_0, values = (var_2528_cast_fp16, var_2690_cast_fp16))[name = tensor<string, []>("op_2750_cast_fp16")];
            tensor<string, []> var_2752_equation_0 = const()[name = tensor<string, []>("op_2752_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2752_cast_fp16 = einsum(equation = var_2752_equation_0, values = (var_2532_cast_fp16, var_2691_cast_fp16))[name = tensor<string, []>("op_2752_cast_fp16")];
            tensor<string, []> var_2754_equation_0 = const()[name = tensor<string, []>("op_2754_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2754_cast_fp16 = einsum(equation = var_2754_equation_0, values = (var_2532_cast_fp16, var_2692_cast_fp16))[name = tensor<string, []>("op_2754_cast_fp16")];
            tensor<string, []> var_2756_equation_0 = const()[name = tensor<string, []>("op_2756_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2756_cast_fp16 = einsum(equation = var_2756_equation_0, values = (var_2532_cast_fp16, var_2693_cast_fp16))[name = tensor<string, []>("op_2756_cast_fp16")];
            tensor<string, []> var_2758_equation_0 = const()[name = tensor<string, []>("op_2758_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_2758_cast_fp16 = einsum(equation = var_2758_equation_0, values = (var_2532_cast_fp16, var_2694_cast_fp16))[name = tensor<string, []>("op_2758_cast_fp16")];
            tensor<bool, []> var_2760_interleave_0 = const()[name = tensor<string, []>("op_2760_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2760_cast_fp16 = concat(axis = var_2147, interleave = var_2760_interleave_0, values = (var_2696_cast_fp16, var_2698_cast_fp16, var_2700_cast_fp16, var_2702_cast_fp16))[name = tensor<string, []>("op_2760_cast_fp16")];
            tensor<bool, []> var_2762_interleave_0 = const()[name = tensor<string, []>("op_2762_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2762_cast_fp16 = concat(axis = var_2147, interleave = var_2762_interleave_0, values = (var_2704_cast_fp16, var_2706_cast_fp16, var_2708_cast_fp16, var_2710_cast_fp16))[name = tensor<string, []>("op_2762_cast_fp16")];
            tensor<bool, []> var_2764_interleave_0 = const()[name = tensor<string, []>("op_2764_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2764_cast_fp16 = concat(axis = var_2147, interleave = var_2764_interleave_0, values = (var_2712_cast_fp16, var_2714_cast_fp16, var_2716_cast_fp16, var_2718_cast_fp16))[name = tensor<string, []>("op_2764_cast_fp16")];
            tensor<bool, []> var_2766_interleave_0 = const()[name = tensor<string, []>("op_2766_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2766_cast_fp16 = concat(axis = var_2147, interleave = var_2766_interleave_0, values = (var_2720_cast_fp16, var_2722_cast_fp16, var_2724_cast_fp16, var_2726_cast_fp16))[name = tensor<string, []>("op_2766_cast_fp16")];
            tensor<bool, []> var_2768_interleave_0 = const()[name = tensor<string, []>("op_2768_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2768_cast_fp16 = concat(axis = var_2147, interleave = var_2768_interleave_0, values = (var_2728_cast_fp16, var_2730_cast_fp16, var_2732_cast_fp16, var_2734_cast_fp16))[name = tensor<string, []>("op_2768_cast_fp16")];
            tensor<bool, []> var_2770_interleave_0 = const()[name = tensor<string, []>("op_2770_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2770_cast_fp16 = concat(axis = var_2147, interleave = var_2770_interleave_0, values = (var_2736_cast_fp16, var_2738_cast_fp16, var_2740_cast_fp16, var_2742_cast_fp16))[name = tensor<string, []>("op_2770_cast_fp16")];
            tensor<bool, []> var_2772_interleave_0 = const()[name = tensor<string, []>("op_2772_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2772_cast_fp16 = concat(axis = var_2147, interleave = var_2772_interleave_0, values = (var_2744_cast_fp16, var_2746_cast_fp16, var_2748_cast_fp16, var_2750_cast_fp16))[name = tensor<string, []>("op_2772_cast_fp16")];
            tensor<bool, []> var_2774_interleave_0 = const()[name = tensor<string, []>("op_2774_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_2774_cast_fp16 = concat(axis = var_2147, interleave = var_2774_interleave_0, values = (var_2752_cast_fp16, var_2754_cast_fp16, var_2756_cast_fp16, var_2758_cast_fp16))[name = tensor<string, []>("op_2774_cast_fp16")];
            tensor<bool, []> input_25_interleave_0 = const()[name = tensor<string, []>("input_25_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 512, 1, 1500]> input_25_cast_fp16 = concat(axis = var_2160, interleave = input_25_interleave_0, values = (var_2760_cast_fp16, var_2762_cast_fp16, var_2764_cast_fp16, var_2766_cast_fp16, var_2768_cast_fp16, var_2770_cast_fp16, var_2772_cast_fp16, var_2774_cast_fp16))[name = tensor<string, []>("input_25_cast_fp16")];
            tensor<int32, [2]> var_2779 = const()[name = tensor<string, []>("op_2779"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2781 = const()[name = tensor<string, []>("op_2781"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_15_pad_type_0 = const()[name = tensor<string, []>("obj_15_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_15_pad_0 = const()[name = tensor<string, []>("obj_15_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_3_self_attn_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_o_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(23850752)))];
            tensor<fp16, [512]> layers_3_self_attn_o_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_self_attn_o_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(24375104)))];
            tensor<fp16, [1, 512, 1, 1500]> obj_15_cast_fp16 = conv(bias = layers_3_self_attn_o_proj_bias_to_fp16, dilations = var_2781, groups = var_2160, pad = obj_15_pad_0, pad_type = obj_15_pad_type_0, strides = var_2779, weight = layers_3_self_attn_o_proj_weight_to_fp16, x = input_25_cast_fp16)[name = tensor<string, []>("obj_15_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_15_cast_fp16 = add(x = inputs_13_cast_fp16, y = obj_15_cast_fp16)[name = tensor<string, []>("inputs_15_cast_fp16")];
            tensor<int32, [1]> var_2787 = const()[name = tensor<string, []>("op_2787"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_15_cast_fp16 = reduce_mean(axes = var_2787, keep_dims = var_2161, x = inputs_15_cast_fp16)[name = tensor<string, []>("channels_mean_15_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_15_cast_fp16 = sub(x = inputs_15_cast_fp16, y = channels_mean_15_cast_fp16)[name = tensor<string, []>("zero_mean_15_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_15_cast_fp16 = mul(x = zero_mean_15_cast_fp16, y = zero_mean_15_cast_fp16)[name = tensor<string, []>("zero_mean_sq_15_cast_fp16")];
            tensor<int32, [1]> var_2791 = const()[name = tensor<string, []>("op_2791"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_2792_cast_fp16 = reduce_mean(axes = var_2791, keep_dims = var_2161, x = zero_mean_sq_15_cast_fp16)[name = tensor<string, []>("op_2792_cast_fp16")];
            tensor<fp16, []> var_2793_to_fp16 = const()[name = tensor<string, []>("op_2793_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_2794_cast_fp16 = add(x = var_2792_cast_fp16, y = var_2793_to_fp16)[name = tensor<string, []>("op_2794_cast_fp16")];
            tensor<fp16, []> denom_15_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_15_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_15_cast_fp16 = rsqrt(epsilon = denom_15_epsilon_0_to_fp16, x = var_2794_cast_fp16)[name = tensor<string, []>("denom_15_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_15_cast_fp16 = mul(x = zero_mean_15_cast_fp16, y = denom_15_cast_fp16)[name = tensor<string, []>("out_15_cast_fp16")];
            tensor<fp16, [512]> input_27_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_27_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(24376192)))];
            tensor<fp16, [512]> input_27_beta_0_to_fp16 = const()[name = tensor<string, []>("input_27_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(24377280)))];
            tensor<fp16, []> input_27_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_27_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> input_27_cast_fp16 = batch_norm(beta = input_27_beta_0_to_fp16, epsilon = input_27_epsilon_0_to_fp16, gamma = input_27_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_15_cast_fp16)[name = tensor<string, []>("input_27_cast_fp16")];
            tensor<int32, [2]> var_2805 = const()[name = tensor<string, []>("op_2805"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2807 = const()[name = tensor<string, []>("op_2807"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> input_29_pad_type_0 = const()[name = tensor<string, []>("input_29_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> input_29_pad_0 = const()[name = tensor<string, []>("input_29_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [2048, 512, 1, 1]> layers_3_fc1_weight_to_fp16 = const()[name = tensor<string, []>("layers_3_fc1_weight_to_fp16"), val = tensor<fp16, [2048, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(24378368)))];
            tensor<fp16, [2048]> layers_3_fc1_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_fc1_bias_to_fp16"), val = tensor<fp16, [2048]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26475584)))];
            tensor<fp16, [1, 2048, 1, 1500]> input_29_cast_fp16 = conv(bias = layers_3_fc1_bias_to_fp16, dilations = var_2807, groups = var_2160, pad = input_29_pad_0, pad_type = input_29_pad_type_0, strides = var_2805, weight = layers_3_fc1_weight_to_fp16, x = input_27_cast_fp16)[name = tensor<string, []>("input_29_cast_fp16")];
            tensor<string, []> input_31_mode_0 = const()[name = tensor<string, []>("input_31_mode_0"), val = tensor<string, []>("EXACT")];
            tensor<fp16, [1, 2048, 1, 1500]> input_31_cast_fp16 = gelu(mode = input_31_mode_0, x = input_29_cast_fp16)[name = tensor<string, []>("input_31_cast_fp16")];
            tensor<int32, [2]> var_2813 = const()[name = tensor<string, []>("op_2813"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2815 = const()[name = tensor<string, []>("op_2815"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> hidden_states_11_pad_type_0 = const()[name = tensor<string, []>("hidden_states_11_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> hidden_states_11_pad_0 = const()[name = tensor<string, []>("hidden_states_11_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 2048, 1, 1]> layers_3_fc2_weight_to_fp16 = const()[name = tensor<string, []>("layers_3_fc2_weight_to_fp16"), val = tensor<fp16, [512, 2048, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(26479744)))];
            tensor<fp16, [512]> layers_3_fc2_bias_to_fp16 = const()[name = tensor<string, []>("layers_3_fc2_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(28576960)))];
            tensor<fp16, [1, 512, 1, 1500]> hidden_states_11_cast_fp16 = conv(bias = layers_3_fc2_bias_to_fp16, dilations = var_2815, groups = var_2160, pad = hidden_states_11_pad_0, pad_type = hidden_states_11_pad_type_0, strides = var_2813, weight = layers_3_fc2_weight_to_fp16, x = input_31_cast_fp16)[name = tensor<string, []>("hidden_states_11_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_17_cast_fp16 = add(x = inputs_15_cast_fp16, y = hidden_states_11_cast_fp16)[name = tensor<string, []>("inputs_17_cast_fp16")];
            tensor<int32, []> var_2822 = const()[name = tensor<string, []>("op_2822"), val = tensor<int32, []>(3)];
            tensor<int32, []> var_2835 = const()[name = tensor<string, []>("op_2835"), val = tensor<int32, []>(1)];
            tensor<bool, []> var_2836 = const()[name = tensor<string, []>("op_2836"), val = tensor<bool, []>(true)];
            tensor<int32, [1]> var_2846 = const()[name = tensor<string, []>("op_2846"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_17_cast_fp16 = reduce_mean(axes = var_2846, keep_dims = var_2836, x = inputs_17_cast_fp16)[name = tensor<string, []>("channels_mean_17_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_17_cast_fp16 = sub(x = inputs_17_cast_fp16, y = channels_mean_17_cast_fp16)[name = tensor<string, []>("zero_mean_17_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_17_cast_fp16 = mul(x = zero_mean_17_cast_fp16, y = zero_mean_17_cast_fp16)[name = tensor<string, []>("zero_mean_sq_17_cast_fp16")];
            tensor<int32, [1]> var_2850 = const()[name = tensor<string, []>("op_2850"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_2851_cast_fp16 = reduce_mean(axes = var_2850, keep_dims = var_2836, x = zero_mean_sq_17_cast_fp16)[name = tensor<string, []>("op_2851_cast_fp16")];
            tensor<fp16, []> var_2852_to_fp16 = const()[name = tensor<string, []>("op_2852_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_2853_cast_fp16 = add(x = var_2851_cast_fp16, y = var_2852_to_fp16)[name = tensor<string, []>("op_2853_cast_fp16")];
            tensor<fp16, []> denom_17_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_17_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_17_cast_fp16 = rsqrt(epsilon = denom_17_epsilon_0_to_fp16, x = var_2853_cast_fp16)[name = tensor<string, []>("denom_17_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_17_cast_fp16 = mul(x = zero_mean_17_cast_fp16, y = denom_17_cast_fp16)[name = tensor<string, []>("out_17_cast_fp16")];
            tensor<fp16, [512]> obj_17_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_17_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(28578048)))];
            tensor<fp16, [512]> obj_17_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_17_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(28579136)))];
            tensor<fp16, []> obj_17_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_17_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> obj_17_cast_fp16 = batch_norm(beta = obj_17_beta_0_to_fp16, epsilon = obj_17_epsilon_0_to_fp16, gamma = obj_17_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_17_cast_fp16)[name = tensor<string, []>("obj_17_cast_fp16")];
            tensor<int32, [2]> var_2868 = const()[name = tensor<string, []>("op_2868"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2870 = const()[name = tensor<string, []>("op_2870"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_9_pad_type_0 = const()[name = tensor<string, []>("query_9_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_9_pad_0 = const()[name = tensor<string, []>("query_9_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_4_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(28580224)))];
            tensor<fp16, [512]> layers_4_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(29104576)))];
            tensor<fp16, [1, 512, 1, 1500]> query_9_cast_fp16 = conv(bias = layers_4_self_attn_q_proj_bias_to_fp16, dilations = var_2870, groups = var_2835, pad = query_9_pad_0, pad_type = query_9_pad_type_0, strides = var_2868, weight = layers_4_self_attn_q_proj_weight_to_fp16, x = obj_17_cast_fp16)[name = tensor<string, []>("query_9_cast_fp16")];
            tensor<int32, [2]> var_2874 = const()[name = tensor<string, []>("op_2874"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2876 = const()[name = tensor<string, []>("op_2876"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_9_pad_type_0 = const()[name = tensor<string, []>("key_9_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_9_pad_0 = const()[name = tensor<string, []>("key_9_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_4_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(29105664)))];
            tensor<fp16, [1, 512, 1, 1500]> key_9_cast_fp16 = conv(dilations = var_2876, groups = var_2835, pad = key_9_pad_0, pad_type = key_9_pad_type_0, strides = var_2874, weight = layers_4_self_attn_k_proj_weight_to_fp16, x = obj_17_cast_fp16)[name = tensor<string, []>("key_9_cast_fp16")];
            tensor<int32, [2]> var_2881 = const()[name = tensor<string, []>("op_2881"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_2883 = const()[name = tensor<string, []>("op_2883"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_9_pad_type_0 = const()[name = tensor<string, []>("value_9_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_9_pad_0 = const()[name = tensor<string, []>("value_9_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_4_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(29630016)))];
            tensor<fp16, [512]> layers_4_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30154368)))];
            tensor<fp16, [1, 512, 1, 1500]> value_9_cast_fp16 = conv(bias = layers_4_self_attn_v_proj_bias_to_fp16, dilations = var_2883, groups = var_2835, pad = value_9_pad_0, pad_type = value_9_pad_type_0, strides = var_2881, weight = layers_4_self_attn_v_proj_weight_to_fp16, x = obj_17_cast_fp16)[name = tensor<string, []>("value_9_cast_fp16")];
            tensor<int32, [4]> var_2890_begin_0 = const()[name = tensor<string, []>("op_2890_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2890_end_0 = const()[name = tensor<string, []>("op_2890_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2890_end_mask_0 = const()[name = tensor<string, []>("op_2890_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2890_cast_fp16 = slice_by_index(begin = var_2890_begin_0, end = var_2890_end_0, end_mask = var_2890_end_mask_0, x = query_9_cast_fp16)[name = tensor<string, []>("op_2890_cast_fp16")];
            tensor<int32, [4]> var_2894_begin_0 = const()[name = tensor<string, []>("op_2894_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_2894_end_0 = const()[name = tensor<string, []>("op_2894_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_2894_end_mask_0 = const()[name = tensor<string, []>("op_2894_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2894_cast_fp16 = slice_by_index(begin = var_2894_begin_0, end = var_2894_end_0, end_mask = var_2894_end_mask_0, x = query_9_cast_fp16)[name = tensor<string, []>("op_2894_cast_fp16")];
            tensor<int32, [4]> var_2898_begin_0 = const()[name = tensor<string, []>("op_2898_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_2898_end_0 = const()[name = tensor<string, []>("op_2898_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_2898_end_mask_0 = const()[name = tensor<string, []>("op_2898_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2898_cast_fp16 = slice_by_index(begin = var_2898_begin_0, end = var_2898_end_0, end_mask = var_2898_end_mask_0, x = query_9_cast_fp16)[name = tensor<string, []>("op_2898_cast_fp16")];
            tensor<int32, [4]> var_2902_begin_0 = const()[name = tensor<string, []>("op_2902_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_2902_end_0 = const()[name = tensor<string, []>("op_2902_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_2902_end_mask_0 = const()[name = tensor<string, []>("op_2902_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2902_cast_fp16 = slice_by_index(begin = var_2902_begin_0, end = var_2902_end_0, end_mask = var_2902_end_mask_0, x = query_9_cast_fp16)[name = tensor<string, []>("op_2902_cast_fp16")];
            tensor<int32, [4]> var_2906_begin_0 = const()[name = tensor<string, []>("op_2906_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_2906_end_0 = const()[name = tensor<string, []>("op_2906_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_2906_end_mask_0 = const()[name = tensor<string, []>("op_2906_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2906_cast_fp16 = slice_by_index(begin = var_2906_begin_0, end = var_2906_end_0, end_mask = var_2906_end_mask_0, x = query_9_cast_fp16)[name = tensor<string, []>("op_2906_cast_fp16")];
            tensor<int32, [4]> var_2910_begin_0 = const()[name = tensor<string, []>("op_2910_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_2910_end_0 = const()[name = tensor<string, []>("op_2910_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_2910_end_mask_0 = const()[name = tensor<string, []>("op_2910_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2910_cast_fp16 = slice_by_index(begin = var_2910_begin_0, end = var_2910_end_0, end_mask = var_2910_end_mask_0, x = query_9_cast_fp16)[name = tensor<string, []>("op_2910_cast_fp16")];
            tensor<int32, [4]> var_2914_begin_0 = const()[name = tensor<string, []>("op_2914_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_2914_end_0 = const()[name = tensor<string, []>("op_2914_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_2914_end_mask_0 = const()[name = tensor<string, []>("op_2914_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2914_cast_fp16 = slice_by_index(begin = var_2914_begin_0, end = var_2914_end_0, end_mask = var_2914_end_mask_0, x = query_9_cast_fp16)[name = tensor<string, []>("op_2914_cast_fp16")];
            tensor<int32, [4]> var_2918_begin_0 = const()[name = tensor<string, []>("op_2918_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_2918_end_0 = const()[name = tensor<string, []>("op_2918_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_2918_end_mask_0 = const()[name = tensor<string, []>("op_2918_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_2918_cast_fp16 = slice_by_index(begin = var_2918_begin_0, end = var_2918_end_0, end_mask = var_2918_end_mask_0, x = query_9_cast_fp16)[name = tensor<string, []>("op_2918_cast_fp16")];
            tensor<int32, [4]> var_2927_begin_0 = const()[name = tensor<string, []>("op_2927_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2927_end_0 = const()[name = tensor<string, []>("op_2927_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2927_end_mask_0 = const()[name = tensor<string, []>("op_2927_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2927_cast_fp16 = slice_by_index(begin = var_2927_begin_0, end = var_2927_end_0, end_mask = var_2927_end_mask_0, x = var_2890_cast_fp16)[name = tensor<string, []>("op_2927_cast_fp16")];
            tensor<int32, [4]> var_2934_begin_0 = const()[name = tensor<string, []>("op_2934_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2934_end_0 = const()[name = tensor<string, []>("op_2934_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2934_end_mask_0 = const()[name = tensor<string, []>("op_2934_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2934_cast_fp16 = slice_by_index(begin = var_2934_begin_0, end = var_2934_end_0, end_mask = var_2934_end_mask_0, x = var_2890_cast_fp16)[name = tensor<string, []>("op_2934_cast_fp16")];
            tensor<int32, [4]> var_2941_begin_0 = const()[name = tensor<string, []>("op_2941_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2941_end_0 = const()[name = tensor<string, []>("op_2941_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2941_end_mask_0 = const()[name = tensor<string, []>("op_2941_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2941_cast_fp16 = slice_by_index(begin = var_2941_begin_0, end = var_2941_end_0, end_mask = var_2941_end_mask_0, x = var_2890_cast_fp16)[name = tensor<string, []>("op_2941_cast_fp16")];
            tensor<int32, [4]> var_2948_begin_0 = const()[name = tensor<string, []>("op_2948_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2948_end_0 = const()[name = tensor<string, []>("op_2948_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2948_end_mask_0 = const()[name = tensor<string, []>("op_2948_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2948_cast_fp16 = slice_by_index(begin = var_2948_begin_0, end = var_2948_end_0, end_mask = var_2948_end_mask_0, x = var_2890_cast_fp16)[name = tensor<string, []>("op_2948_cast_fp16")];
            tensor<int32, [4]> var_2955_begin_0 = const()[name = tensor<string, []>("op_2955_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2955_end_0 = const()[name = tensor<string, []>("op_2955_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2955_end_mask_0 = const()[name = tensor<string, []>("op_2955_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2955_cast_fp16 = slice_by_index(begin = var_2955_begin_0, end = var_2955_end_0, end_mask = var_2955_end_mask_0, x = var_2894_cast_fp16)[name = tensor<string, []>("op_2955_cast_fp16")];
            tensor<int32, [4]> var_2962_begin_0 = const()[name = tensor<string, []>("op_2962_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2962_end_0 = const()[name = tensor<string, []>("op_2962_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2962_end_mask_0 = const()[name = tensor<string, []>("op_2962_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2962_cast_fp16 = slice_by_index(begin = var_2962_begin_0, end = var_2962_end_0, end_mask = var_2962_end_mask_0, x = var_2894_cast_fp16)[name = tensor<string, []>("op_2962_cast_fp16")];
            tensor<int32, [4]> var_2969_begin_0 = const()[name = tensor<string, []>("op_2969_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2969_end_0 = const()[name = tensor<string, []>("op_2969_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2969_end_mask_0 = const()[name = tensor<string, []>("op_2969_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2969_cast_fp16 = slice_by_index(begin = var_2969_begin_0, end = var_2969_end_0, end_mask = var_2969_end_mask_0, x = var_2894_cast_fp16)[name = tensor<string, []>("op_2969_cast_fp16")];
            tensor<int32, [4]> var_2976_begin_0 = const()[name = tensor<string, []>("op_2976_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_2976_end_0 = const()[name = tensor<string, []>("op_2976_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_2976_end_mask_0 = const()[name = tensor<string, []>("op_2976_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2976_cast_fp16 = slice_by_index(begin = var_2976_begin_0, end = var_2976_end_0, end_mask = var_2976_end_mask_0, x = var_2894_cast_fp16)[name = tensor<string, []>("op_2976_cast_fp16")];
            tensor<int32, [4]> var_2983_begin_0 = const()[name = tensor<string, []>("op_2983_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_2983_end_0 = const()[name = tensor<string, []>("op_2983_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_2983_end_mask_0 = const()[name = tensor<string, []>("op_2983_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2983_cast_fp16 = slice_by_index(begin = var_2983_begin_0, end = var_2983_end_0, end_mask = var_2983_end_mask_0, x = var_2898_cast_fp16)[name = tensor<string, []>("op_2983_cast_fp16")];
            tensor<int32, [4]> var_2990_begin_0 = const()[name = tensor<string, []>("op_2990_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_2990_end_0 = const()[name = tensor<string, []>("op_2990_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_2990_end_mask_0 = const()[name = tensor<string, []>("op_2990_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2990_cast_fp16 = slice_by_index(begin = var_2990_begin_0, end = var_2990_end_0, end_mask = var_2990_end_mask_0, x = var_2898_cast_fp16)[name = tensor<string, []>("op_2990_cast_fp16")];
            tensor<int32, [4]> var_2997_begin_0 = const()[name = tensor<string, []>("op_2997_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_2997_end_0 = const()[name = tensor<string, []>("op_2997_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_2997_end_mask_0 = const()[name = tensor<string, []>("op_2997_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_2997_cast_fp16 = slice_by_index(begin = var_2997_begin_0, end = var_2997_end_0, end_mask = var_2997_end_mask_0, x = var_2898_cast_fp16)[name = tensor<string, []>("op_2997_cast_fp16")];
            tensor<int32, [4]> var_3004_begin_0 = const()[name = tensor<string, []>("op_3004_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3004_end_0 = const()[name = tensor<string, []>("op_3004_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3004_end_mask_0 = const()[name = tensor<string, []>("op_3004_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3004_cast_fp16 = slice_by_index(begin = var_3004_begin_0, end = var_3004_end_0, end_mask = var_3004_end_mask_0, x = var_2898_cast_fp16)[name = tensor<string, []>("op_3004_cast_fp16")];
            tensor<int32, [4]> var_3011_begin_0 = const()[name = tensor<string, []>("op_3011_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3011_end_0 = const()[name = tensor<string, []>("op_3011_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3011_end_mask_0 = const()[name = tensor<string, []>("op_3011_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3011_cast_fp16 = slice_by_index(begin = var_3011_begin_0, end = var_3011_end_0, end_mask = var_3011_end_mask_0, x = var_2902_cast_fp16)[name = tensor<string, []>("op_3011_cast_fp16")];
            tensor<int32, [4]> var_3018_begin_0 = const()[name = tensor<string, []>("op_3018_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3018_end_0 = const()[name = tensor<string, []>("op_3018_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3018_end_mask_0 = const()[name = tensor<string, []>("op_3018_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3018_cast_fp16 = slice_by_index(begin = var_3018_begin_0, end = var_3018_end_0, end_mask = var_3018_end_mask_0, x = var_2902_cast_fp16)[name = tensor<string, []>("op_3018_cast_fp16")];
            tensor<int32, [4]> var_3025_begin_0 = const()[name = tensor<string, []>("op_3025_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3025_end_0 = const()[name = tensor<string, []>("op_3025_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3025_end_mask_0 = const()[name = tensor<string, []>("op_3025_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3025_cast_fp16 = slice_by_index(begin = var_3025_begin_0, end = var_3025_end_0, end_mask = var_3025_end_mask_0, x = var_2902_cast_fp16)[name = tensor<string, []>("op_3025_cast_fp16")];
            tensor<int32, [4]> var_3032_begin_0 = const()[name = tensor<string, []>("op_3032_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3032_end_0 = const()[name = tensor<string, []>("op_3032_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3032_end_mask_0 = const()[name = tensor<string, []>("op_3032_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3032_cast_fp16 = slice_by_index(begin = var_3032_begin_0, end = var_3032_end_0, end_mask = var_3032_end_mask_0, x = var_2902_cast_fp16)[name = tensor<string, []>("op_3032_cast_fp16")];
            tensor<int32, [4]> var_3039_begin_0 = const()[name = tensor<string, []>("op_3039_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3039_end_0 = const()[name = tensor<string, []>("op_3039_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3039_end_mask_0 = const()[name = tensor<string, []>("op_3039_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3039_cast_fp16 = slice_by_index(begin = var_3039_begin_0, end = var_3039_end_0, end_mask = var_3039_end_mask_0, x = var_2906_cast_fp16)[name = tensor<string, []>("op_3039_cast_fp16")];
            tensor<int32, [4]> var_3046_begin_0 = const()[name = tensor<string, []>("op_3046_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3046_end_0 = const()[name = tensor<string, []>("op_3046_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3046_end_mask_0 = const()[name = tensor<string, []>("op_3046_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3046_cast_fp16 = slice_by_index(begin = var_3046_begin_0, end = var_3046_end_0, end_mask = var_3046_end_mask_0, x = var_2906_cast_fp16)[name = tensor<string, []>("op_3046_cast_fp16")];
            tensor<int32, [4]> var_3053_begin_0 = const()[name = tensor<string, []>("op_3053_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3053_end_0 = const()[name = tensor<string, []>("op_3053_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3053_end_mask_0 = const()[name = tensor<string, []>("op_3053_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3053_cast_fp16 = slice_by_index(begin = var_3053_begin_0, end = var_3053_end_0, end_mask = var_3053_end_mask_0, x = var_2906_cast_fp16)[name = tensor<string, []>("op_3053_cast_fp16")];
            tensor<int32, [4]> var_3060_begin_0 = const()[name = tensor<string, []>("op_3060_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3060_end_0 = const()[name = tensor<string, []>("op_3060_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3060_end_mask_0 = const()[name = tensor<string, []>("op_3060_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3060_cast_fp16 = slice_by_index(begin = var_3060_begin_0, end = var_3060_end_0, end_mask = var_3060_end_mask_0, x = var_2906_cast_fp16)[name = tensor<string, []>("op_3060_cast_fp16")];
            tensor<int32, [4]> var_3067_begin_0 = const()[name = tensor<string, []>("op_3067_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3067_end_0 = const()[name = tensor<string, []>("op_3067_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3067_end_mask_0 = const()[name = tensor<string, []>("op_3067_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3067_cast_fp16 = slice_by_index(begin = var_3067_begin_0, end = var_3067_end_0, end_mask = var_3067_end_mask_0, x = var_2910_cast_fp16)[name = tensor<string, []>("op_3067_cast_fp16")];
            tensor<int32, [4]> var_3074_begin_0 = const()[name = tensor<string, []>("op_3074_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3074_end_0 = const()[name = tensor<string, []>("op_3074_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3074_end_mask_0 = const()[name = tensor<string, []>("op_3074_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3074_cast_fp16 = slice_by_index(begin = var_3074_begin_0, end = var_3074_end_0, end_mask = var_3074_end_mask_0, x = var_2910_cast_fp16)[name = tensor<string, []>("op_3074_cast_fp16")];
            tensor<int32, [4]> var_3081_begin_0 = const()[name = tensor<string, []>("op_3081_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3081_end_0 = const()[name = tensor<string, []>("op_3081_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3081_end_mask_0 = const()[name = tensor<string, []>("op_3081_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3081_cast_fp16 = slice_by_index(begin = var_3081_begin_0, end = var_3081_end_0, end_mask = var_3081_end_mask_0, x = var_2910_cast_fp16)[name = tensor<string, []>("op_3081_cast_fp16")];
            tensor<int32, [4]> var_3088_begin_0 = const()[name = tensor<string, []>("op_3088_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3088_end_0 = const()[name = tensor<string, []>("op_3088_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3088_end_mask_0 = const()[name = tensor<string, []>("op_3088_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3088_cast_fp16 = slice_by_index(begin = var_3088_begin_0, end = var_3088_end_0, end_mask = var_3088_end_mask_0, x = var_2910_cast_fp16)[name = tensor<string, []>("op_3088_cast_fp16")];
            tensor<int32, [4]> var_3095_begin_0 = const()[name = tensor<string, []>("op_3095_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3095_end_0 = const()[name = tensor<string, []>("op_3095_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3095_end_mask_0 = const()[name = tensor<string, []>("op_3095_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3095_cast_fp16 = slice_by_index(begin = var_3095_begin_0, end = var_3095_end_0, end_mask = var_3095_end_mask_0, x = var_2914_cast_fp16)[name = tensor<string, []>("op_3095_cast_fp16")];
            tensor<int32, [4]> var_3102_begin_0 = const()[name = tensor<string, []>("op_3102_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3102_end_0 = const()[name = tensor<string, []>("op_3102_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3102_end_mask_0 = const()[name = tensor<string, []>("op_3102_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3102_cast_fp16 = slice_by_index(begin = var_3102_begin_0, end = var_3102_end_0, end_mask = var_3102_end_mask_0, x = var_2914_cast_fp16)[name = tensor<string, []>("op_3102_cast_fp16")];
            tensor<int32, [4]> var_3109_begin_0 = const()[name = tensor<string, []>("op_3109_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3109_end_0 = const()[name = tensor<string, []>("op_3109_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3109_end_mask_0 = const()[name = tensor<string, []>("op_3109_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3109_cast_fp16 = slice_by_index(begin = var_3109_begin_0, end = var_3109_end_0, end_mask = var_3109_end_mask_0, x = var_2914_cast_fp16)[name = tensor<string, []>("op_3109_cast_fp16")];
            tensor<int32, [4]> var_3116_begin_0 = const()[name = tensor<string, []>("op_3116_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3116_end_0 = const()[name = tensor<string, []>("op_3116_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3116_end_mask_0 = const()[name = tensor<string, []>("op_3116_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3116_cast_fp16 = slice_by_index(begin = var_3116_begin_0, end = var_3116_end_0, end_mask = var_3116_end_mask_0, x = var_2914_cast_fp16)[name = tensor<string, []>("op_3116_cast_fp16")];
            tensor<int32, [4]> var_3123_begin_0 = const()[name = tensor<string, []>("op_3123_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3123_end_0 = const()[name = tensor<string, []>("op_3123_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3123_end_mask_0 = const()[name = tensor<string, []>("op_3123_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3123_cast_fp16 = slice_by_index(begin = var_3123_begin_0, end = var_3123_end_0, end_mask = var_3123_end_mask_0, x = var_2918_cast_fp16)[name = tensor<string, []>("op_3123_cast_fp16")];
            tensor<int32, [4]> var_3130_begin_0 = const()[name = tensor<string, []>("op_3130_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3130_end_0 = const()[name = tensor<string, []>("op_3130_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3130_end_mask_0 = const()[name = tensor<string, []>("op_3130_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3130_cast_fp16 = slice_by_index(begin = var_3130_begin_0, end = var_3130_end_0, end_mask = var_3130_end_mask_0, x = var_2918_cast_fp16)[name = tensor<string, []>("op_3130_cast_fp16")];
            tensor<int32, [4]> var_3137_begin_0 = const()[name = tensor<string, []>("op_3137_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3137_end_0 = const()[name = tensor<string, []>("op_3137_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3137_end_mask_0 = const()[name = tensor<string, []>("op_3137_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3137_cast_fp16 = slice_by_index(begin = var_3137_begin_0, end = var_3137_end_0, end_mask = var_3137_end_mask_0, x = var_2918_cast_fp16)[name = tensor<string, []>("op_3137_cast_fp16")];
            tensor<int32, [4]> var_3144_begin_0 = const()[name = tensor<string, []>("op_3144_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3144_end_0 = const()[name = tensor<string, []>("op_3144_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3144_end_mask_0 = const()[name = tensor<string, []>("op_3144_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3144_cast_fp16 = slice_by_index(begin = var_3144_begin_0, end = var_3144_end_0, end_mask = var_3144_end_mask_0, x = var_2918_cast_fp16)[name = tensor<string, []>("op_3144_cast_fp16")];
            tensor<int32, [4]> k_9_perm_0 = const()[name = tensor<string, []>("k_9_perm_0"), val = tensor<int32, [4]>([0, 3, 2, 1])];
            tensor<int32, [4]> var_3149_begin_0 = const()[name = tensor<string, []>("op_3149_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3149_end_0 = const()[name = tensor<string, []>("op_3149_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 64])];
            tensor<bool, [4]> var_3149_end_mask_0 = const()[name = tensor<string, []>("op_3149_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 512]> transpose_1 = transpose(perm = k_9_perm_0, x = key_9_cast_fp16)[name = tensor<string, []>("transpose_1")];
            tensor<fp16, [1, 1500, 1, 64]> var_3149_cast_fp16 = slice_by_index(begin = var_3149_begin_0, end = var_3149_end_0, end_mask = var_3149_end_mask_0, x = transpose_1)[name = tensor<string, []>("op_3149_cast_fp16")];
            tensor<int32, [4]> var_3153_begin_0 = const()[name = tensor<string, []>("op_3153_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 64])];
            tensor<int32, [4]> var_3153_end_0 = const()[name = tensor<string, []>("op_3153_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 128])];
            tensor<bool, [4]> var_3153_end_mask_0 = const()[name = tensor<string, []>("op_3153_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3153_cast_fp16 = slice_by_index(begin = var_3153_begin_0, end = var_3153_end_0, end_mask = var_3153_end_mask_0, x = transpose_1)[name = tensor<string, []>("op_3153_cast_fp16")];
            tensor<int32, [4]> var_3157_begin_0 = const()[name = tensor<string, []>("op_3157_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 128])];
            tensor<int32, [4]> var_3157_end_0 = const()[name = tensor<string, []>("op_3157_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 192])];
            tensor<bool, [4]> var_3157_end_mask_0 = const()[name = tensor<string, []>("op_3157_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3157_cast_fp16 = slice_by_index(begin = var_3157_begin_0, end = var_3157_end_0, end_mask = var_3157_end_mask_0, x = transpose_1)[name = tensor<string, []>("op_3157_cast_fp16")];
            tensor<int32, [4]> var_3161_begin_0 = const()[name = tensor<string, []>("op_3161_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 192])];
            tensor<int32, [4]> var_3161_end_0 = const()[name = tensor<string, []>("op_3161_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 256])];
            tensor<bool, [4]> var_3161_end_mask_0 = const()[name = tensor<string, []>("op_3161_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3161_cast_fp16 = slice_by_index(begin = var_3161_begin_0, end = var_3161_end_0, end_mask = var_3161_end_mask_0, x = transpose_1)[name = tensor<string, []>("op_3161_cast_fp16")];
            tensor<int32, [4]> var_3165_begin_0 = const()[name = tensor<string, []>("op_3165_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 256])];
            tensor<int32, [4]> var_3165_end_0 = const()[name = tensor<string, []>("op_3165_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 320])];
            tensor<bool, [4]> var_3165_end_mask_0 = const()[name = tensor<string, []>("op_3165_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3165_cast_fp16 = slice_by_index(begin = var_3165_begin_0, end = var_3165_end_0, end_mask = var_3165_end_mask_0, x = transpose_1)[name = tensor<string, []>("op_3165_cast_fp16")];
            tensor<int32, [4]> var_3169_begin_0 = const()[name = tensor<string, []>("op_3169_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 320])];
            tensor<int32, [4]> var_3169_end_0 = const()[name = tensor<string, []>("op_3169_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 384])];
            tensor<bool, [4]> var_3169_end_mask_0 = const()[name = tensor<string, []>("op_3169_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3169_cast_fp16 = slice_by_index(begin = var_3169_begin_0, end = var_3169_end_0, end_mask = var_3169_end_mask_0, x = transpose_1)[name = tensor<string, []>("op_3169_cast_fp16")];
            tensor<int32, [4]> var_3173_begin_0 = const()[name = tensor<string, []>("op_3173_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 384])];
            tensor<int32, [4]> var_3173_end_0 = const()[name = tensor<string, []>("op_3173_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 448])];
            tensor<bool, [4]> var_3173_end_mask_0 = const()[name = tensor<string, []>("op_3173_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3173_cast_fp16 = slice_by_index(begin = var_3173_begin_0, end = var_3173_end_0, end_mask = var_3173_end_mask_0, x = transpose_1)[name = tensor<string, []>("op_3173_cast_fp16")];
            tensor<int32, [4]> var_3177_begin_0 = const()[name = tensor<string, []>("op_3177_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 448])];
            tensor<int32, [4]> var_3177_end_0 = const()[name = tensor<string, []>("op_3177_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 512])];
            tensor<bool, [4]> var_3177_end_mask_0 = const()[name = tensor<string, []>("op_3177_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3177_cast_fp16 = slice_by_index(begin = var_3177_begin_0, end = var_3177_end_0, end_mask = var_3177_end_mask_0, x = transpose_1)[name = tensor<string, []>("op_3177_cast_fp16")];
            tensor<int32, [4]> var_3179_begin_0 = const()[name = tensor<string, []>("op_3179_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3179_end_0 = const()[name = tensor<string, []>("op_3179_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3179_end_mask_0 = const()[name = tensor<string, []>("op_3179_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3179_cast_fp16 = slice_by_index(begin = var_3179_begin_0, end = var_3179_end_0, end_mask = var_3179_end_mask_0, x = value_9_cast_fp16)[name = tensor<string, []>("op_3179_cast_fp16")];
            tensor<int32, [4]> var_3183_begin_0 = const()[name = tensor<string, []>("op_3183_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_3183_end_0 = const()[name = tensor<string, []>("op_3183_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_3183_end_mask_0 = const()[name = tensor<string, []>("op_3183_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3183_cast_fp16 = slice_by_index(begin = var_3183_begin_0, end = var_3183_end_0, end_mask = var_3183_end_mask_0, x = value_9_cast_fp16)[name = tensor<string, []>("op_3183_cast_fp16")];
            tensor<int32, [4]> var_3187_begin_0 = const()[name = tensor<string, []>("op_3187_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_3187_end_0 = const()[name = tensor<string, []>("op_3187_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_3187_end_mask_0 = const()[name = tensor<string, []>("op_3187_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3187_cast_fp16 = slice_by_index(begin = var_3187_begin_0, end = var_3187_end_0, end_mask = var_3187_end_mask_0, x = value_9_cast_fp16)[name = tensor<string, []>("op_3187_cast_fp16")];
            tensor<int32, [4]> var_3191_begin_0 = const()[name = tensor<string, []>("op_3191_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_3191_end_0 = const()[name = tensor<string, []>("op_3191_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_3191_end_mask_0 = const()[name = tensor<string, []>("op_3191_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3191_cast_fp16 = slice_by_index(begin = var_3191_begin_0, end = var_3191_end_0, end_mask = var_3191_end_mask_0, x = value_9_cast_fp16)[name = tensor<string, []>("op_3191_cast_fp16")];
            tensor<int32, [4]> var_3195_begin_0 = const()[name = tensor<string, []>("op_3195_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_3195_end_0 = const()[name = tensor<string, []>("op_3195_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_3195_end_mask_0 = const()[name = tensor<string, []>("op_3195_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3195_cast_fp16 = slice_by_index(begin = var_3195_begin_0, end = var_3195_end_0, end_mask = var_3195_end_mask_0, x = value_9_cast_fp16)[name = tensor<string, []>("op_3195_cast_fp16")];
            tensor<int32, [4]> var_3199_begin_0 = const()[name = tensor<string, []>("op_3199_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_3199_end_0 = const()[name = tensor<string, []>("op_3199_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_3199_end_mask_0 = const()[name = tensor<string, []>("op_3199_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3199_cast_fp16 = slice_by_index(begin = var_3199_begin_0, end = var_3199_end_0, end_mask = var_3199_end_mask_0, x = value_9_cast_fp16)[name = tensor<string, []>("op_3199_cast_fp16")];
            tensor<int32, [4]> var_3203_begin_0 = const()[name = tensor<string, []>("op_3203_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_3203_end_0 = const()[name = tensor<string, []>("op_3203_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_3203_end_mask_0 = const()[name = tensor<string, []>("op_3203_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3203_cast_fp16 = slice_by_index(begin = var_3203_begin_0, end = var_3203_end_0, end_mask = var_3203_end_mask_0, x = value_9_cast_fp16)[name = tensor<string, []>("op_3203_cast_fp16")];
            tensor<int32, [4]> var_3207_begin_0 = const()[name = tensor<string, []>("op_3207_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_3207_end_0 = const()[name = tensor<string, []>("op_3207_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_3207_end_mask_0 = const()[name = tensor<string, []>("op_3207_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3207_cast_fp16 = slice_by_index(begin = var_3207_begin_0, end = var_3207_end_0, end_mask = var_3207_end_mask_0, x = value_9_cast_fp16)[name = tensor<string, []>("op_3207_cast_fp16")];
            tensor<string, []> var_3211_equation_0 = const()[name = tensor<string, []>("op_3211_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3211_cast_fp16 = einsum(equation = var_3211_equation_0, values = (var_3149_cast_fp16, var_2927_cast_fp16))[name = tensor<string, []>("op_3211_cast_fp16")];
            tensor<fp16, []> var_3212_to_fp16 = const()[name = tensor<string, []>("op_3212_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_257_cast_fp16 = mul(x = var_3211_cast_fp16, y = var_3212_to_fp16)[name = tensor<string, []>("aw_chunk_257_cast_fp16")];
            tensor<string, []> var_3215_equation_0 = const()[name = tensor<string, []>("op_3215_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3215_cast_fp16 = einsum(equation = var_3215_equation_0, values = (var_3149_cast_fp16, var_2934_cast_fp16))[name = tensor<string, []>("op_3215_cast_fp16")];
            tensor<fp16, []> var_3216_to_fp16 = const()[name = tensor<string, []>("op_3216_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_259_cast_fp16 = mul(x = var_3215_cast_fp16, y = var_3216_to_fp16)[name = tensor<string, []>("aw_chunk_259_cast_fp16")];
            tensor<string, []> var_3219_equation_0 = const()[name = tensor<string, []>("op_3219_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3219_cast_fp16 = einsum(equation = var_3219_equation_0, values = (var_3149_cast_fp16, var_2941_cast_fp16))[name = tensor<string, []>("op_3219_cast_fp16")];
            tensor<fp16, []> var_3220_to_fp16 = const()[name = tensor<string, []>("op_3220_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_261_cast_fp16 = mul(x = var_3219_cast_fp16, y = var_3220_to_fp16)[name = tensor<string, []>("aw_chunk_261_cast_fp16")];
            tensor<string, []> var_3223_equation_0 = const()[name = tensor<string, []>("op_3223_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3223_cast_fp16 = einsum(equation = var_3223_equation_0, values = (var_3149_cast_fp16, var_2948_cast_fp16))[name = tensor<string, []>("op_3223_cast_fp16")];
            tensor<fp16, []> var_3224_to_fp16 = const()[name = tensor<string, []>("op_3224_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_263_cast_fp16 = mul(x = var_3223_cast_fp16, y = var_3224_to_fp16)[name = tensor<string, []>("aw_chunk_263_cast_fp16")];
            tensor<string, []> var_3227_equation_0 = const()[name = tensor<string, []>("op_3227_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3227_cast_fp16 = einsum(equation = var_3227_equation_0, values = (var_3153_cast_fp16, var_2955_cast_fp16))[name = tensor<string, []>("op_3227_cast_fp16")];
            tensor<fp16, []> var_3228_to_fp16 = const()[name = tensor<string, []>("op_3228_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_265_cast_fp16 = mul(x = var_3227_cast_fp16, y = var_3228_to_fp16)[name = tensor<string, []>("aw_chunk_265_cast_fp16")];
            tensor<string, []> var_3231_equation_0 = const()[name = tensor<string, []>("op_3231_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3231_cast_fp16 = einsum(equation = var_3231_equation_0, values = (var_3153_cast_fp16, var_2962_cast_fp16))[name = tensor<string, []>("op_3231_cast_fp16")];
            tensor<fp16, []> var_3232_to_fp16 = const()[name = tensor<string, []>("op_3232_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_267_cast_fp16 = mul(x = var_3231_cast_fp16, y = var_3232_to_fp16)[name = tensor<string, []>("aw_chunk_267_cast_fp16")];
            tensor<string, []> var_3235_equation_0 = const()[name = tensor<string, []>("op_3235_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3235_cast_fp16 = einsum(equation = var_3235_equation_0, values = (var_3153_cast_fp16, var_2969_cast_fp16))[name = tensor<string, []>("op_3235_cast_fp16")];
            tensor<fp16, []> var_3236_to_fp16 = const()[name = tensor<string, []>("op_3236_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_269_cast_fp16 = mul(x = var_3235_cast_fp16, y = var_3236_to_fp16)[name = tensor<string, []>("aw_chunk_269_cast_fp16")];
            tensor<string, []> var_3239_equation_0 = const()[name = tensor<string, []>("op_3239_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3239_cast_fp16 = einsum(equation = var_3239_equation_0, values = (var_3153_cast_fp16, var_2976_cast_fp16))[name = tensor<string, []>("op_3239_cast_fp16")];
            tensor<fp16, []> var_3240_to_fp16 = const()[name = tensor<string, []>("op_3240_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_271_cast_fp16 = mul(x = var_3239_cast_fp16, y = var_3240_to_fp16)[name = tensor<string, []>("aw_chunk_271_cast_fp16")];
            tensor<string, []> var_3243_equation_0 = const()[name = tensor<string, []>("op_3243_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3243_cast_fp16 = einsum(equation = var_3243_equation_0, values = (var_3157_cast_fp16, var_2983_cast_fp16))[name = tensor<string, []>("op_3243_cast_fp16")];
            tensor<fp16, []> var_3244_to_fp16 = const()[name = tensor<string, []>("op_3244_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_273_cast_fp16 = mul(x = var_3243_cast_fp16, y = var_3244_to_fp16)[name = tensor<string, []>("aw_chunk_273_cast_fp16")];
            tensor<string, []> var_3247_equation_0 = const()[name = tensor<string, []>("op_3247_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3247_cast_fp16 = einsum(equation = var_3247_equation_0, values = (var_3157_cast_fp16, var_2990_cast_fp16))[name = tensor<string, []>("op_3247_cast_fp16")];
            tensor<fp16, []> var_3248_to_fp16 = const()[name = tensor<string, []>("op_3248_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_275_cast_fp16 = mul(x = var_3247_cast_fp16, y = var_3248_to_fp16)[name = tensor<string, []>("aw_chunk_275_cast_fp16")];
            tensor<string, []> var_3251_equation_0 = const()[name = tensor<string, []>("op_3251_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3251_cast_fp16 = einsum(equation = var_3251_equation_0, values = (var_3157_cast_fp16, var_2997_cast_fp16))[name = tensor<string, []>("op_3251_cast_fp16")];
            tensor<fp16, []> var_3252_to_fp16 = const()[name = tensor<string, []>("op_3252_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_277_cast_fp16 = mul(x = var_3251_cast_fp16, y = var_3252_to_fp16)[name = tensor<string, []>("aw_chunk_277_cast_fp16")];
            tensor<string, []> var_3255_equation_0 = const()[name = tensor<string, []>("op_3255_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3255_cast_fp16 = einsum(equation = var_3255_equation_0, values = (var_3157_cast_fp16, var_3004_cast_fp16))[name = tensor<string, []>("op_3255_cast_fp16")];
            tensor<fp16, []> var_3256_to_fp16 = const()[name = tensor<string, []>("op_3256_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_279_cast_fp16 = mul(x = var_3255_cast_fp16, y = var_3256_to_fp16)[name = tensor<string, []>("aw_chunk_279_cast_fp16")];
            tensor<string, []> var_3259_equation_0 = const()[name = tensor<string, []>("op_3259_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3259_cast_fp16 = einsum(equation = var_3259_equation_0, values = (var_3161_cast_fp16, var_3011_cast_fp16))[name = tensor<string, []>("op_3259_cast_fp16")];
            tensor<fp16, []> var_3260_to_fp16 = const()[name = tensor<string, []>("op_3260_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_281_cast_fp16 = mul(x = var_3259_cast_fp16, y = var_3260_to_fp16)[name = tensor<string, []>("aw_chunk_281_cast_fp16")];
            tensor<string, []> var_3263_equation_0 = const()[name = tensor<string, []>("op_3263_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3263_cast_fp16 = einsum(equation = var_3263_equation_0, values = (var_3161_cast_fp16, var_3018_cast_fp16))[name = tensor<string, []>("op_3263_cast_fp16")];
            tensor<fp16, []> var_3264_to_fp16 = const()[name = tensor<string, []>("op_3264_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_283_cast_fp16 = mul(x = var_3263_cast_fp16, y = var_3264_to_fp16)[name = tensor<string, []>("aw_chunk_283_cast_fp16")];
            tensor<string, []> var_3267_equation_0 = const()[name = tensor<string, []>("op_3267_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3267_cast_fp16 = einsum(equation = var_3267_equation_0, values = (var_3161_cast_fp16, var_3025_cast_fp16))[name = tensor<string, []>("op_3267_cast_fp16")];
            tensor<fp16, []> var_3268_to_fp16 = const()[name = tensor<string, []>("op_3268_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_285_cast_fp16 = mul(x = var_3267_cast_fp16, y = var_3268_to_fp16)[name = tensor<string, []>("aw_chunk_285_cast_fp16")];
            tensor<string, []> var_3271_equation_0 = const()[name = tensor<string, []>("op_3271_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3271_cast_fp16 = einsum(equation = var_3271_equation_0, values = (var_3161_cast_fp16, var_3032_cast_fp16))[name = tensor<string, []>("op_3271_cast_fp16")];
            tensor<fp16, []> var_3272_to_fp16 = const()[name = tensor<string, []>("op_3272_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_287_cast_fp16 = mul(x = var_3271_cast_fp16, y = var_3272_to_fp16)[name = tensor<string, []>("aw_chunk_287_cast_fp16")];
            tensor<string, []> var_3275_equation_0 = const()[name = tensor<string, []>("op_3275_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3275_cast_fp16 = einsum(equation = var_3275_equation_0, values = (var_3165_cast_fp16, var_3039_cast_fp16))[name = tensor<string, []>("op_3275_cast_fp16")];
            tensor<fp16, []> var_3276_to_fp16 = const()[name = tensor<string, []>("op_3276_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_289_cast_fp16 = mul(x = var_3275_cast_fp16, y = var_3276_to_fp16)[name = tensor<string, []>("aw_chunk_289_cast_fp16")];
            tensor<string, []> var_3279_equation_0 = const()[name = tensor<string, []>("op_3279_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3279_cast_fp16 = einsum(equation = var_3279_equation_0, values = (var_3165_cast_fp16, var_3046_cast_fp16))[name = tensor<string, []>("op_3279_cast_fp16")];
            tensor<fp16, []> var_3280_to_fp16 = const()[name = tensor<string, []>("op_3280_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_291_cast_fp16 = mul(x = var_3279_cast_fp16, y = var_3280_to_fp16)[name = tensor<string, []>("aw_chunk_291_cast_fp16")];
            tensor<string, []> var_3283_equation_0 = const()[name = tensor<string, []>("op_3283_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3283_cast_fp16 = einsum(equation = var_3283_equation_0, values = (var_3165_cast_fp16, var_3053_cast_fp16))[name = tensor<string, []>("op_3283_cast_fp16")];
            tensor<fp16, []> var_3284_to_fp16 = const()[name = tensor<string, []>("op_3284_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_293_cast_fp16 = mul(x = var_3283_cast_fp16, y = var_3284_to_fp16)[name = tensor<string, []>("aw_chunk_293_cast_fp16")];
            tensor<string, []> var_3287_equation_0 = const()[name = tensor<string, []>("op_3287_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3287_cast_fp16 = einsum(equation = var_3287_equation_0, values = (var_3165_cast_fp16, var_3060_cast_fp16))[name = tensor<string, []>("op_3287_cast_fp16")];
            tensor<fp16, []> var_3288_to_fp16 = const()[name = tensor<string, []>("op_3288_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_295_cast_fp16 = mul(x = var_3287_cast_fp16, y = var_3288_to_fp16)[name = tensor<string, []>("aw_chunk_295_cast_fp16")];
            tensor<string, []> var_3291_equation_0 = const()[name = tensor<string, []>("op_3291_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3291_cast_fp16 = einsum(equation = var_3291_equation_0, values = (var_3169_cast_fp16, var_3067_cast_fp16))[name = tensor<string, []>("op_3291_cast_fp16")];
            tensor<fp16, []> var_3292_to_fp16 = const()[name = tensor<string, []>("op_3292_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_297_cast_fp16 = mul(x = var_3291_cast_fp16, y = var_3292_to_fp16)[name = tensor<string, []>("aw_chunk_297_cast_fp16")];
            tensor<string, []> var_3295_equation_0 = const()[name = tensor<string, []>("op_3295_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3295_cast_fp16 = einsum(equation = var_3295_equation_0, values = (var_3169_cast_fp16, var_3074_cast_fp16))[name = tensor<string, []>("op_3295_cast_fp16")];
            tensor<fp16, []> var_3296_to_fp16 = const()[name = tensor<string, []>("op_3296_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_299_cast_fp16 = mul(x = var_3295_cast_fp16, y = var_3296_to_fp16)[name = tensor<string, []>("aw_chunk_299_cast_fp16")];
            tensor<string, []> var_3299_equation_0 = const()[name = tensor<string, []>("op_3299_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3299_cast_fp16 = einsum(equation = var_3299_equation_0, values = (var_3169_cast_fp16, var_3081_cast_fp16))[name = tensor<string, []>("op_3299_cast_fp16")];
            tensor<fp16, []> var_3300_to_fp16 = const()[name = tensor<string, []>("op_3300_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_301_cast_fp16 = mul(x = var_3299_cast_fp16, y = var_3300_to_fp16)[name = tensor<string, []>("aw_chunk_301_cast_fp16")];
            tensor<string, []> var_3303_equation_0 = const()[name = tensor<string, []>("op_3303_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3303_cast_fp16 = einsum(equation = var_3303_equation_0, values = (var_3169_cast_fp16, var_3088_cast_fp16))[name = tensor<string, []>("op_3303_cast_fp16")];
            tensor<fp16, []> var_3304_to_fp16 = const()[name = tensor<string, []>("op_3304_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_303_cast_fp16 = mul(x = var_3303_cast_fp16, y = var_3304_to_fp16)[name = tensor<string, []>("aw_chunk_303_cast_fp16")];
            tensor<string, []> var_3307_equation_0 = const()[name = tensor<string, []>("op_3307_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3307_cast_fp16 = einsum(equation = var_3307_equation_0, values = (var_3173_cast_fp16, var_3095_cast_fp16))[name = tensor<string, []>("op_3307_cast_fp16")];
            tensor<fp16, []> var_3308_to_fp16 = const()[name = tensor<string, []>("op_3308_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_305_cast_fp16 = mul(x = var_3307_cast_fp16, y = var_3308_to_fp16)[name = tensor<string, []>("aw_chunk_305_cast_fp16")];
            tensor<string, []> var_3311_equation_0 = const()[name = tensor<string, []>("op_3311_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3311_cast_fp16 = einsum(equation = var_3311_equation_0, values = (var_3173_cast_fp16, var_3102_cast_fp16))[name = tensor<string, []>("op_3311_cast_fp16")];
            tensor<fp16, []> var_3312_to_fp16 = const()[name = tensor<string, []>("op_3312_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_307_cast_fp16 = mul(x = var_3311_cast_fp16, y = var_3312_to_fp16)[name = tensor<string, []>("aw_chunk_307_cast_fp16")];
            tensor<string, []> var_3315_equation_0 = const()[name = tensor<string, []>("op_3315_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3315_cast_fp16 = einsum(equation = var_3315_equation_0, values = (var_3173_cast_fp16, var_3109_cast_fp16))[name = tensor<string, []>("op_3315_cast_fp16")];
            tensor<fp16, []> var_3316_to_fp16 = const()[name = tensor<string, []>("op_3316_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_309_cast_fp16 = mul(x = var_3315_cast_fp16, y = var_3316_to_fp16)[name = tensor<string, []>("aw_chunk_309_cast_fp16")];
            tensor<string, []> var_3319_equation_0 = const()[name = tensor<string, []>("op_3319_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3319_cast_fp16 = einsum(equation = var_3319_equation_0, values = (var_3173_cast_fp16, var_3116_cast_fp16))[name = tensor<string, []>("op_3319_cast_fp16")];
            tensor<fp16, []> var_3320_to_fp16 = const()[name = tensor<string, []>("op_3320_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_311_cast_fp16 = mul(x = var_3319_cast_fp16, y = var_3320_to_fp16)[name = tensor<string, []>("aw_chunk_311_cast_fp16")];
            tensor<string, []> var_3323_equation_0 = const()[name = tensor<string, []>("op_3323_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3323_cast_fp16 = einsum(equation = var_3323_equation_0, values = (var_3177_cast_fp16, var_3123_cast_fp16))[name = tensor<string, []>("op_3323_cast_fp16")];
            tensor<fp16, []> var_3324_to_fp16 = const()[name = tensor<string, []>("op_3324_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_313_cast_fp16 = mul(x = var_3323_cast_fp16, y = var_3324_to_fp16)[name = tensor<string, []>("aw_chunk_313_cast_fp16")];
            tensor<string, []> var_3327_equation_0 = const()[name = tensor<string, []>("op_3327_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3327_cast_fp16 = einsum(equation = var_3327_equation_0, values = (var_3177_cast_fp16, var_3130_cast_fp16))[name = tensor<string, []>("op_3327_cast_fp16")];
            tensor<fp16, []> var_3328_to_fp16 = const()[name = tensor<string, []>("op_3328_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_315_cast_fp16 = mul(x = var_3327_cast_fp16, y = var_3328_to_fp16)[name = tensor<string, []>("aw_chunk_315_cast_fp16")];
            tensor<string, []> var_3331_equation_0 = const()[name = tensor<string, []>("op_3331_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3331_cast_fp16 = einsum(equation = var_3331_equation_0, values = (var_3177_cast_fp16, var_3137_cast_fp16))[name = tensor<string, []>("op_3331_cast_fp16")];
            tensor<fp16, []> var_3332_to_fp16 = const()[name = tensor<string, []>("op_3332_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_317_cast_fp16 = mul(x = var_3331_cast_fp16, y = var_3332_to_fp16)[name = tensor<string, []>("aw_chunk_317_cast_fp16")];
            tensor<string, []> var_3335_equation_0 = const()[name = tensor<string, []>("op_3335_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3335_cast_fp16 = einsum(equation = var_3335_equation_0, values = (var_3177_cast_fp16, var_3144_cast_fp16))[name = tensor<string, []>("op_3335_cast_fp16")];
            tensor<fp16, []> var_3336_to_fp16 = const()[name = tensor<string, []>("op_3336_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_319_cast_fp16 = mul(x = var_3335_cast_fp16, y = var_3336_to_fp16)[name = tensor<string, []>("aw_chunk_319_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3338_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_257_cast_fp16)[name = tensor<string, []>("op_3338_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3339_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_259_cast_fp16)[name = tensor<string, []>("op_3339_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3340_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_261_cast_fp16)[name = tensor<string, []>("op_3340_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3341_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_263_cast_fp16)[name = tensor<string, []>("op_3341_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3342_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_265_cast_fp16)[name = tensor<string, []>("op_3342_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3343_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_267_cast_fp16)[name = tensor<string, []>("op_3343_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3344_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_269_cast_fp16)[name = tensor<string, []>("op_3344_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3345_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_271_cast_fp16)[name = tensor<string, []>("op_3345_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3346_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_273_cast_fp16)[name = tensor<string, []>("op_3346_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3347_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_275_cast_fp16)[name = tensor<string, []>("op_3347_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3348_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_277_cast_fp16)[name = tensor<string, []>("op_3348_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3349_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_279_cast_fp16)[name = tensor<string, []>("op_3349_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3350_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_281_cast_fp16)[name = tensor<string, []>("op_3350_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3351_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_283_cast_fp16)[name = tensor<string, []>("op_3351_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3352_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_285_cast_fp16)[name = tensor<string, []>("op_3352_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3353_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_287_cast_fp16)[name = tensor<string, []>("op_3353_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3354_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_289_cast_fp16)[name = tensor<string, []>("op_3354_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3355_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_291_cast_fp16)[name = tensor<string, []>("op_3355_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3356_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_293_cast_fp16)[name = tensor<string, []>("op_3356_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3357_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_295_cast_fp16)[name = tensor<string, []>("op_3357_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3358_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_297_cast_fp16)[name = tensor<string, []>("op_3358_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3359_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_299_cast_fp16)[name = tensor<string, []>("op_3359_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3360_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_301_cast_fp16)[name = tensor<string, []>("op_3360_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3361_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_303_cast_fp16)[name = tensor<string, []>("op_3361_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3362_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_305_cast_fp16)[name = tensor<string, []>("op_3362_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3363_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_307_cast_fp16)[name = tensor<string, []>("op_3363_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3364_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_309_cast_fp16)[name = tensor<string, []>("op_3364_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3365_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_311_cast_fp16)[name = tensor<string, []>("op_3365_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3366_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_313_cast_fp16)[name = tensor<string, []>("op_3366_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3367_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_315_cast_fp16)[name = tensor<string, []>("op_3367_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3368_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_317_cast_fp16)[name = tensor<string, []>("op_3368_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_3369_cast_fp16 = softmax(axis = var_2835, x = aw_chunk_319_cast_fp16)[name = tensor<string, []>("op_3369_cast_fp16")];
            tensor<string, []> var_3371_equation_0 = const()[name = tensor<string, []>("op_3371_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3371_cast_fp16 = einsum(equation = var_3371_equation_0, values = (var_3179_cast_fp16, var_3338_cast_fp16))[name = tensor<string, []>("op_3371_cast_fp16")];
            tensor<string, []> var_3373_equation_0 = const()[name = tensor<string, []>("op_3373_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3373_cast_fp16 = einsum(equation = var_3373_equation_0, values = (var_3179_cast_fp16, var_3339_cast_fp16))[name = tensor<string, []>("op_3373_cast_fp16")];
            tensor<string, []> var_3375_equation_0 = const()[name = tensor<string, []>("op_3375_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3375_cast_fp16 = einsum(equation = var_3375_equation_0, values = (var_3179_cast_fp16, var_3340_cast_fp16))[name = tensor<string, []>("op_3375_cast_fp16")];
            tensor<string, []> var_3377_equation_0 = const()[name = tensor<string, []>("op_3377_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3377_cast_fp16 = einsum(equation = var_3377_equation_0, values = (var_3179_cast_fp16, var_3341_cast_fp16))[name = tensor<string, []>("op_3377_cast_fp16")];
            tensor<string, []> var_3379_equation_0 = const()[name = tensor<string, []>("op_3379_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3379_cast_fp16 = einsum(equation = var_3379_equation_0, values = (var_3183_cast_fp16, var_3342_cast_fp16))[name = tensor<string, []>("op_3379_cast_fp16")];
            tensor<string, []> var_3381_equation_0 = const()[name = tensor<string, []>("op_3381_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3381_cast_fp16 = einsum(equation = var_3381_equation_0, values = (var_3183_cast_fp16, var_3343_cast_fp16))[name = tensor<string, []>("op_3381_cast_fp16")];
            tensor<string, []> var_3383_equation_0 = const()[name = tensor<string, []>("op_3383_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3383_cast_fp16 = einsum(equation = var_3383_equation_0, values = (var_3183_cast_fp16, var_3344_cast_fp16))[name = tensor<string, []>("op_3383_cast_fp16")];
            tensor<string, []> var_3385_equation_0 = const()[name = tensor<string, []>("op_3385_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3385_cast_fp16 = einsum(equation = var_3385_equation_0, values = (var_3183_cast_fp16, var_3345_cast_fp16))[name = tensor<string, []>("op_3385_cast_fp16")];
            tensor<string, []> var_3387_equation_0 = const()[name = tensor<string, []>("op_3387_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3387_cast_fp16 = einsum(equation = var_3387_equation_0, values = (var_3187_cast_fp16, var_3346_cast_fp16))[name = tensor<string, []>("op_3387_cast_fp16")];
            tensor<string, []> var_3389_equation_0 = const()[name = tensor<string, []>("op_3389_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3389_cast_fp16 = einsum(equation = var_3389_equation_0, values = (var_3187_cast_fp16, var_3347_cast_fp16))[name = tensor<string, []>("op_3389_cast_fp16")];
            tensor<string, []> var_3391_equation_0 = const()[name = tensor<string, []>("op_3391_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3391_cast_fp16 = einsum(equation = var_3391_equation_0, values = (var_3187_cast_fp16, var_3348_cast_fp16))[name = tensor<string, []>("op_3391_cast_fp16")];
            tensor<string, []> var_3393_equation_0 = const()[name = tensor<string, []>("op_3393_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3393_cast_fp16 = einsum(equation = var_3393_equation_0, values = (var_3187_cast_fp16, var_3349_cast_fp16))[name = tensor<string, []>("op_3393_cast_fp16")];
            tensor<string, []> var_3395_equation_0 = const()[name = tensor<string, []>("op_3395_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3395_cast_fp16 = einsum(equation = var_3395_equation_0, values = (var_3191_cast_fp16, var_3350_cast_fp16))[name = tensor<string, []>("op_3395_cast_fp16")];
            tensor<string, []> var_3397_equation_0 = const()[name = tensor<string, []>("op_3397_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3397_cast_fp16 = einsum(equation = var_3397_equation_0, values = (var_3191_cast_fp16, var_3351_cast_fp16))[name = tensor<string, []>("op_3397_cast_fp16")];
            tensor<string, []> var_3399_equation_0 = const()[name = tensor<string, []>("op_3399_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3399_cast_fp16 = einsum(equation = var_3399_equation_0, values = (var_3191_cast_fp16, var_3352_cast_fp16))[name = tensor<string, []>("op_3399_cast_fp16")];
            tensor<string, []> var_3401_equation_0 = const()[name = tensor<string, []>("op_3401_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3401_cast_fp16 = einsum(equation = var_3401_equation_0, values = (var_3191_cast_fp16, var_3353_cast_fp16))[name = tensor<string, []>("op_3401_cast_fp16")];
            tensor<string, []> var_3403_equation_0 = const()[name = tensor<string, []>("op_3403_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3403_cast_fp16 = einsum(equation = var_3403_equation_0, values = (var_3195_cast_fp16, var_3354_cast_fp16))[name = tensor<string, []>("op_3403_cast_fp16")];
            tensor<string, []> var_3405_equation_0 = const()[name = tensor<string, []>("op_3405_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3405_cast_fp16 = einsum(equation = var_3405_equation_0, values = (var_3195_cast_fp16, var_3355_cast_fp16))[name = tensor<string, []>("op_3405_cast_fp16")];
            tensor<string, []> var_3407_equation_0 = const()[name = tensor<string, []>("op_3407_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3407_cast_fp16 = einsum(equation = var_3407_equation_0, values = (var_3195_cast_fp16, var_3356_cast_fp16))[name = tensor<string, []>("op_3407_cast_fp16")];
            tensor<string, []> var_3409_equation_0 = const()[name = tensor<string, []>("op_3409_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3409_cast_fp16 = einsum(equation = var_3409_equation_0, values = (var_3195_cast_fp16, var_3357_cast_fp16))[name = tensor<string, []>("op_3409_cast_fp16")];
            tensor<string, []> var_3411_equation_0 = const()[name = tensor<string, []>("op_3411_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3411_cast_fp16 = einsum(equation = var_3411_equation_0, values = (var_3199_cast_fp16, var_3358_cast_fp16))[name = tensor<string, []>("op_3411_cast_fp16")];
            tensor<string, []> var_3413_equation_0 = const()[name = tensor<string, []>("op_3413_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3413_cast_fp16 = einsum(equation = var_3413_equation_0, values = (var_3199_cast_fp16, var_3359_cast_fp16))[name = tensor<string, []>("op_3413_cast_fp16")];
            tensor<string, []> var_3415_equation_0 = const()[name = tensor<string, []>("op_3415_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3415_cast_fp16 = einsum(equation = var_3415_equation_0, values = (var_3199_cast_fp16, var_3360_cast_fp16))[name = tensor<string, []>("op_3415_cast_fp16")];
            tensor<string, []> var_3417_equation_0 = const()[name = tensor<string, []>("op_3417_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3417_cast_fp16 = einsum(equation = var_3417_equation_0, values = (var_3199_cast_fp16, var_3361_cast_fp16))[name = tensor<string, []>("op_3417_cast_fp16")];
            tensor<string, []> var_3419_equation_0 = const()[name = tensor<string, []>("op_3419_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3419_cast_fp16 = einsum(equation = var_3419_equation_0, values = (var_3203_cast_fp16, var_3362_cast_fp16))[name = tensor<string, []>("op_3419_cast_fp16")];
            tensor<string, []> var_3421_equation_0 = const()[name = tensor<string, []>("op_3421_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3421_cast_fp16 = einsum(equation = var_3421_equation_0, values = (var_3203_cast_fp16, var_3363_cast_fp16))[name = tensor<string, []>("op_3421_cast_fp16")];
            tensor<string, []> var_3423_equation_0 = const()[name = tensor<string, []>("op_3423_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3423_cast_fp16 = einsum(equation = var_3423_equation_0, values = (var_3203_cast_fp16, var_3364_cast_fp16))[name = tensor<string, []>("op_3423_cast_fp16")];
            tensor<string, []> var_3425_equation_0 = const()[name = tensor<string, []>("op_3425_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3425_cast_fp16 = einsum(equation = var_3425_equation_0, values = (var_3203_cast_fp16, var_3365_cast_fp16))[name = tensor<string, []>("op_3425_cast_fp16")];
            tensor<string, []> var_3427_equation_0 = const()[name = tensor<string, []>("op_3427_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3427_cast_fp16 = einsum(equation = var_3427_equation_0, values = (var_3207_cast_fp16, var_3366_cast_fp16))[name = tensor<string, []>("op_3427_cast_fp16")];
            tensor<string, []> var_3429_equation_0 = const()[name = tensor<string, []>("op_3429_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3429_cast_fp16 = einsum(equation = var_3429_equation_0, values = (var_3207_cast_fp16, var_3367_cast_fp16))[name = tensor<string, []>("op_3429_cast_fp16")];
            tensor<string, []> var_3431_equation_0 = const()[name = tensor<string, []>("op_3431_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3431_cast_fp16 = einsum(equation = var_3431_equation_0, values = (var_3207_cast_fp16, var_3368_cast_fp16))[name = tensor<string, []>("op_3431_cast_fp16")];
            tensor<string, []> var_3433_equation_0 = const()[name = tensor<string, []>("op_3433_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_3433_cast_fp16 = einsum(equation = var_3433_equation_0, values = (var_3207_cast_fp16, var_3369_cast_fp16))[name = tensor<string, []>("op_3433_cast_fp16")];
            tensor<bool, []> var_3435_interleave_0 = const()[name = tensor<string, []>("op_3435_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_3435_cast_fp16 = concat(axis = var_2822, interleave = var_3435_interleave_0, values = (var_3371_cast_fp16, var_3373_cast_fp16, var_3375_cast_fp16, var_3377_cast_fp16))[name = tensor<string, []>("op_3435_cast_fp16")];
            tensor<bool, []> var_3437_interleave_0 = const()[name = tensor<string, []>("op_3437_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_3437_cast_fp16 = concat(axis = var_2822, interleave = var_3437_interleave_0, values = (var_3379_cast_fp16, var_3381_cast_fp16, var_3383_cast_fp16, var_3385_cast_fp16))[name = tensor<string, []>("op_3437_cast_fp16")];
            tensor<bool, []> var_3439_interleave_0 = const()[name = tensor<string, []>("op_3439_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_3439_cast_fp16 = concat(axis = var_2822, interleave = var_3439_interleave_0, values = (var_3387_cast_fp16, var_3389_cast_fp16, var_3391_cast_fp16, var_3393_cast_fp16))[name = tensor<string, []>("op_3439_cast_fp16")];
            tensor<bool, []> var_3441_interleave_0 = const()[name = tensor<string, []>("op_3441_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_3441_cast_fp16 = concat(axis = var_2822, interleave = var_3441_interleave_0, values = (var_3395_cast_fp16, var_3397_cast_fp16, var_3399_cast_fp16, var_3401_cast_fp16))[name = tensor<string, []>("op_3441_cast_fp16")];
            tensor<bool, []> var_3443_interleave_0 = const()[name = tensor<string, []>("op_3443_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_3443_cast_fp16 = concat(axis = var_2822, interleave = var_3443_interleave_0, values = (var_3403_cast_fp16, var_3405_cast_fp16, var_3407_cast_fp16, var_3409_cast_fp16))[name = tensor<string, []>("op_3443_cast_fp16")];
            tensor<bool, []> var_3445_interleave_0 = const()[name = tensor<string, []>("op_3445_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_3445_cast_fp16 = concat(axis = var_2822, interleave = var_3445_interleave_0, values = (var_3411_cast_fp16, var_3413_cast_fp16, var_3415_cast_fp16, var_3417_cast_fp16))[name = tensor<string, []>("op_3445_cast_fp16")];
            tensor<bool, []> var_3447_interleave_0 = const()[name = tensor<string, []>("op_3447_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_3447_cast_fp16 = concat(axis = var_2822, interleave = var_3447_interleave_0, values = (var_3419_cast_fp16, var_3421_cast_fp16, var_3423_cast_fp16, var_3425_cast_fp16))[name = tensor<string, []>("op_3447_cast_fp16")];
            tensor<bool, []> var_3449_interleave_0 = const()[name = tensor<string, []>("op_3449_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_3449_cast_fp16 = concat(axis = var_2822, interleave = var_3449_interleave_0, values = (var_3427_cast_fp16, var_3429_cast_fp16, var_3431_cast_fp16, var_3433_cast_fp16))[name = tensor<string, []>("op_3449_cast_fp16")];
            tensor<bool, []> input_33_interleave_0 = const()[name = tensor<string, []>("input_33_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 512, 1, 1500]> input_33_cast_fp16 = concat(axis = var_2835, interleave = input_33_interleave_0, values = (var_3435_cast_fp16, var_3437_cast_fp16, var_3439_cast_fp16, var_3441_cast_fp16, var_3443_cast_fp16, var_3445_cast_fp16, var_3447_cast_fp16, var_3449_cast_fp16))[name = tensor<string, []>("input_33_cast_fp16")];
            tensor<int32, [2]> var_3454 = const()[name = tensor<string, []>("op_3454"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3456 = const()[name = tensor<string, []>("op_3456"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_19_pad_type_0 = const()[name = tensor<string, []>("obj_19_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_19_pad_0 = const()[name = tensor<string, []>("obj_19_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_4_self_attn_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_o_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30155456)))];
            tensor<fp16, [512]> layers_4_self_attn_o_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_self_attn_o_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30679808)))];
            tensor<fp16, [1, 512, 1, 1500]> obj_19_cast_fp16 = conv(bias = layers_4_self_attn_o_proj_bias_to_fp16, dilations = var_3456, groups = var_2835, pad = obj_19_pad_0, pad_type = obj_19_pad_type_0, strides = var_3454, weight = layers_4_self_attn_o_proj_weight_to_fp16, x = input_33_cast_fp16)[name = tensor<string, []>("obj_19_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_19_cast_fp16 = add(x = inputs_17_cast_fp16, y = obj_19_cast_fp16)[name = tensor<string, []>("inputs_19_cast_fp16")];
            tensor<int32, [1]> var_3462 = const()[name = tensor<string, []>("op_3462"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_19_cast_fp16 = reduce_mean(axes = var_3462, keep_dims = var_2836, x = inputs_19_cast_fp16)[name = tensor<string, []>("channels_mean_19_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_19_cast_fp16 = sub(x = inputs_19_cast_fp16, y = channels_mean_19_cast_fp16)[name = tensor<string, []>("zero_mean_19_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_19_cast_fp16 = mul(x = zero_mean_19_cast_fp16, y = zero_mean_19_cast_fp16)[name = tensor<string, []>("zero_mean_sq_19_cast_fp16")];
            tensor<int32, [1]> var_3466 = const()[name = tensor<string, []>("op_3466"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_3467_cast_fp16 = reduce_mean(axes = var_3466, keep_dims = var_2836, x = zero_mean_sq_19_cast_fp16)[name = tensor<string, []>("op_3467_cast_fp16")];
            tensor<fp16, []> var_3468_to_fp16 = const()[name = tensor<string, []>("op_3468_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_3469_cast_fp16 = add(x = var_3467_cast_fp16, y = var_3468_to_fp16)[name = tensor<string, []>("op_3469_cast_fp16")];
            tensor<fp16, []> denom_19_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_19_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_19_cast_fp16 = rsqrt(epsilon = denom_19_epsilon_0_to_fp16, x = var_3469_cast_fp16)[name = tensor<string, []>("denom_19_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_19_cast_fp16 = mul(x = zero_mean_19_cast_fp16, y = denom_19_cast_fp16)[name = tensor<string, []>("out_19_cast_fp16")];
            tensor<fp16, [512]> input_35_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_35_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30680896)))];
            tensor<fp16, [512]> input_35_beta_0_to_fp16 = const()[name = tensor<string, []>("input_35_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30681984)))];
            tensor<fp16, []> input_35_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_35_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> input_35_cast_fp16 = batch_norm(beta = input_35_beta_0_to_fp16, epsilon = input_35_epsilon_0_to_fp16, gamma = input_35_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_19_cast_fp16)[name = tensor<string, []>("input_35_cast_fp16")];
            tensor<int32, [2]> var_3480 = const()[name = tensor<string, []>("op_3480"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3482 = const()[name = tensor<string, []>("op_3482"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> input_37_pad_type_0 = const()[name = tensor<string, []>("input_37_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> input_37_pad_0 = const()[name = tensor<string, []>("input_37_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [2048, 512, 1, 1]> layers_4_fc1_weight_to_fp16 = const()[name = tensor<string, []>("layers_4_fc1_weight_to_fp16"), val = tensor<fp16, [2048, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(30683072)))];
            tensor<fp16, [2048]> layers_4_fc1_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_fc1_bias_to_fp16"), val = tensor<fp16, [2048]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(32780288)))];
            tensor<fp16, [1, 2048, 1, 1500]> input_37_cast_fp16 = conv(bias = layers_4_fc1_bias_to_fp16, dilations = var_3482, groups = var_2835, pad = input_37_pad_0, pad_type = input_37_pad_type_0, strides = var_3480, weight = layers_4_fc1_weight_to_fp16, x = input_35_cast_fp16)[name = tensor<string, []>("input_37_cast_fp16")];
            tensor<string, []> input_39_mode_0 = const()[name = tensor<string, []>("input_39_mode_0"), val = tensor<string, []>("EXACT")];
            tensor<fp16, [1, 2048, 1, 1500]> input_39_cast_fp16 = gelu(mode = input_39_mode_0, x = input_37_cast_fp16)[name = tensor<string, []>("input_39_cast_fp16")];
            tensor<int32, [2]> var_3488 = const()[name = tensor<string, []>("op_3488"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3490 = const()[name = tensor<string, []>("op_3490"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> hidden_states_13_pad_type_0 = const()[name = tensor<string, []>("hidden_states_13_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> hidden_states_13_pad_0 = const()[name = tensor<string, []>("hidden_states_13_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 2048, 1, 1]> layers_4_fc2_weight_to_fp16 = const()[name = tensor<string, []>("layers_4_fc2_weight_to_fp16"), val = tensor<fp16, [512, 2048, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(32784448)))];
            tensor<fp16, [512]> layers_4_fc2_bias_to_fp16 = const()[name = tensor<string, []>("layers_4_fc2_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34881664)))];
            tensor<fp16, [1, 512, 1, 1500]> hidden_states_13_cast_fp16 = conv(bias = layers_4_fc2_bias_to_fp16, dilations = var_3490, groups = var_2835, pad = hidden_states_13_pad_0, pad_type = hidden_states_13_pad_type_0, strides = var_3488, weight = layers_4_fc2_weight_to_fp16, x = input_39_cast_fp16)[name = tensor<string, []>("hidden_states_13_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_21_cast_fp16 = add(x = inputs_19_cast_fp16, y = hidden_states_13_cast_fp16)[name = tensor<string, []>("inputs_21_cast_fp16")];
            tensor<int32, []> var_3497 = const()[name = tensor<string, []>("op_3497"), val = tensor<int32, []>(3)];
            tensor<int32, []> var_3510 = const()[name = tensor<string, []>("op_3510"), val = tensor<int32, []>(1)];
            tensor<bool, []> var_3511 = const()[name = tensor<string, []>("op_3511"), val = tensor<bool, []>(true)];
            tensor<int32, [1]> var_3521 = const()[name = tensor<string, []>("op_3521"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_21_cast_fp16 = reduce_mean(axes = var_3521, keep_dims = var_3511, x = inputs_21_cast_fp16)[name = tensor<string, []>("channels_mean_21_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_21_cast_fp16 = sub(x = inputs_21_cast_fp16, y = channels_mean_21_cast_fp16)[name = tensor<string, []>("zero_mean_21_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_21_cast_fp16 = mul(x = zero_mean_21_cast_fp16, y = zero_mean_21_cast_fp16)[name = tensor<string, []>("zero_mean_sq_21_cast_fp16")];
            tensor<int32, [1]> var_3525 = const()[name = tensor<string, []>("op_3525"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_3526_cast_fp16 = reduce_mean(axes = var_3525, keep_dims = var_3511, x = zero_mean_sq_21_cast_fp16)[name = tensor<string, []>("op_3526_cast_fp16")];
            tensor<fp16, []> var_3527_to_fp16 = const()[name = tensor<string, []>("op_3527_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_3528_cast_fp16 = add(x = var_3526_cast_fp16, y = var_3527_to_fp16)[name = tensor<string, []>("op_3528_cast_fp16")];
            tensor<fp16, []> denom_21_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_21_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_21_cast_fp16 = rsqrt(epsilon = denom_21_epsilon_0_to_fp16, x = var_3528_cast_fp16)[name = tensor<string, []>("denom_21_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_21_cast_fp16 = mul(x = zero_mean_21_cast_fp16, y = denom_21_cast_fp16)[name = tensor<string, []>("out_21_cast_fp16")];
            tensor<fp16, [512]> obj_21_gamma_0_to_fp16 = const()[name = tensor<string, []>("obj_21_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34882752)))];
            tensor<fp16, [512]> obj_21_beta_0_to_fp16 = const()[name = tensor<string, []>("obj_21_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34883840)))];
            tensor<fp16, []> obj_21_epsilon_0_to_fp16 = const()[name = tensor<string, []>("obj_21_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> obj_21_cast_fp16 = batch_norm(beta = obj_21_beta_0_to_fp16, epsilon = obj_21_epsilon_0_to_fp16, gamma = obj_21_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_21_cast_fp16)[name = tensor<string, []>("obj_21_cast_fp16")];
            tensor<int32, [2]> var_3543 = const()[name = tensor<string, []>("op_3543"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3545 = const()[name = tensor<string, []>("op_3545"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> query_pad_type_0 = const()[name = tensor<string, []>("query_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> query_pad_0 = const()[name = tensor<string, []>("query_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_5_self_attn_q_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_q_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(34884928)))];
            tensor<fp16, [512]> layers_5_self_attn_q_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_q_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35409280)))];
            tensor<fp16, [1, 512, 1, 1500]> query_cast_fp16 = conv(bias = layers_5_self_attn_q_proj_bias_to_fp16, dilations = var_3545, groups = var_3510, pad = query_pad_0, pad_type = query_pad_type_0, strides = var_3543, weight = layers_5_self_attn_q_proj_weight_to_fp16, x = obj_21_cast_fp16)[name = tensor<string, []>("query_cast_fp16")];
            tensor<int32, [2]> var_3549 = const()[name = tensor<string, []>("op_3549"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3551 = const()[name = tensor<string, []>("op_3551"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> key_pad_type_0 = const()[name = tensor<string, []>("key_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> key_pad_0 = const()[name = tensor<string, []>("key_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_5_self_attn_k_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_k_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35410368)))];
            tensor<fp16, [1, 512, 1, 1500]> key_cast_fp16 = conv(dilations = var_3551, groups = var_3510, pad = key_pad_0, pad_type = key_pad_type_0, strides = var_3549, weight = layers_5_self_attn_k_proj_weight_to_fp16, x = obj_21_cast_fp16)[name = tensor<string, []>("key_cast_fp16")];
            tensor<int32, [2]> var_3556 = const()[name = tensor<string, []>("op_3556"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_3558 = const()[name = tensor<string, []>("op_3558"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> value_pad_type_0 = const()[name = tensor<string, []>("value_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> value_pad_0 = const()[name = tensor<string, []>("value_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_5_self_attn_v_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_v_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(35934720)))];
            tensor<fp16, [512]> layers_5_self_attn_v_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_v_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36459072)))];
            tensor<fp16, [1, 512, 1, 1500]> value_cast_fp16 = conv(bias = layers_5_self_attn_v_proj_bias_to_fp16, dilations = var_3558, groups = var_3510, pad = value_pad_0, pad_type = value_pad_type_0, strides = var_3556, weight = layers_5_self_attn_v_proj_weight_to_fp16, x = obj_21_cast_fp16)[name = tensor<string, []>("value_cast_fp16")];
            tensor<int32, [4]> var_3565_begin_0 = const()[name = tensor<string, []>("op_3565_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3565_end_0 = const()[name = tensor<string, []>("op_3565_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3565_end_mask_0 = const()[name = tensor<string, []>("op_3565_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3565_cast_fp16 = slice_by_index(begin = var_3565_begin_0, end = var_3565_end_0, end_mask = var_3565_end_mask_0, x = query_cast_fp16)[name = tensor<string, []>("op_3565_cast_fp16")];
            tensor<int32, [4]> var_3569_begin_0 = const()[name = tensor<string, []>("op_3569_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_3569_end_0 = const()[name = tensor<string, []>("op_3569_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_3569_end_mask_0 = const()[name = tensor<string, []>("op_3569_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3569_cast_fp16 = slice_by_index(begin = var_3569_begin_0, end = var_3569_end_0, end_mask = var_3569_end_mask_0, x = query_cast_fp16)[name = tensor<string, []>("op_3569_cast_fp16")];
            tensor<int32, [4]> var_3573_begin_0 = const()[name = tensor<string, []>("op_3573_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_3573_end_0 = const()[name = tensor<string, []>("op_3573_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_3573_end_mask_0 = const()[name = tensor<string, []>("op_3573_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3573_cast_fp16 = slice_by_index(begin = var_3573_begin_0, end = var_3573_end_0, end_mask = var_3573_end_mask_0, x = query_cast_fp16)[name = tensor<string, []>("op_3573_cast_fp16")];
            tensor<int32, [4]> var_3577_begin_0 = const()[name = tensor<string, []>("op_3577_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_3577_end_0 = const()[name = tensor<string, []>("op_3577_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_3577_end_mask_0 = const()[name = tensor<string, []>("op_3577_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3577_cast_fp16 = slice_by_index(begin = var_3577_begin_0, end = var_3577_end_0, end_mask = var_3577_end_mask_0, x = query_cast_fp16)[name = tensor<string, []>("op_3577_cast_fp16")];
            tensor<int32, [4]> var_3581_begin_0 = const()[name = tensor<string, []>("op_3581_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_3581_end_0 = const()[name = tensor<string, []>("op_3581_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_3581_end_mask_0 = const()[name = tensor<string, []>("op_3581_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3581_cast_fp16 = slice_by_index(begin = var_3581_begin_0, end = var_3581_end_0, end_mask = var_3581_end_mask_0, x = query_cast_fp16)[name = tensor<string, []>("op_3581_cast_fp16")];
            tensor<int32, [4]> var_3585_begin_0 = const()[name = tensor<string, []>("op_3585_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_3585_end_0 = const()[name = tensor<string, []>("op_3585_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_3585_end_mask_0 = const()[name = tensor<string, []>("op_3585_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3585_cast_fp16 = slice_by_index(begin = var_3585_begin_0, end = var_3585_end_0, end_mask = var_3585_end_mask_0, x = query_cast_fp16)[name = tensor<string, []>("op_3585_cast_fp16")];
            tensor<int32, [4]> var_3589_begin_0 = const()[name = tensor<string, []>("op_3589_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_3589_end_0 = const()[name = tensor<string, []>("op_3589_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_3589_end_mask_0 = const()[name = tensor<string, []>("op_3589_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3589_cast_fp16 = slice_by_index(begin = var_3589_begin_0, end = var_3589_end_0, end_mask = var_3589_end_mask_0, x = query_cast_fp16)[name = tensor<string, []>("op_3589_cast_fp16")];
            tensor<int32, [4]> var_3593_begin_0 = const()[name = tensor<string, []>("op_3593_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_3593_end_0 = const()[name = tensor<string, []>("op_3593_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_3593_end_mask_0 = const()[name = tensor<string, []>("op_3593_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3593_cast_fp16 = slice_by_index(begin = var_3593_begin_0, end = var_3593_end_0, end_mask = var_3593_end_mask_0, x = query_cast_fp16)[name = tensor<string, []>("op_3593_cast_fp16")];
            tensor<int32, [4]> var_3602_begin_0 = const()[name = tensor<string, []>("op_3602_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3602_end_0 = const()[name = tensor<string, []>("op_3602_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3602_end_mask_0 = const()[name = tensor<string, []>("op_3602_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3602_cast_fp16 = slice_by_index(begin = var_3602_begin_0, end = var_3602_end_0, end_mask = var_3602_end_mask_0, x = var_3565_cast_fp16)[name = tensor<string, []>("op_3602_cast_fp16")];
            tensor<int32, [4]> var_3609_begin_0 = const()[name = tensor<string, []>("op_3609_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3609_end_0 = const()[name = tensor<string, []>("op_3609_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3609_end_mask_0 = const()[name = tensor<string, []>("op_3609_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3609_cast_fp16 = slice_by_index(begin = var_3609_begin_0, end = var_3609_end_0, end_mask = var_3609_end_mask_0, x = var_3565_cast_fp16)[name = tensor<string, []>("op_3609_cast_fp16")];
            tensor<int32, [4]> var_3616_begin_0 = const()[name = tensor<string, []>("op_3616_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3616_end_0 = const()[name = tensor<string, []>("op_3616_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3616_end_mask_0 = const()[name = tensor<string, []>("op_3616_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3616_cast_fp16 = slice_by_index(begin = var_3616_begin_0, end = var_3616_end_0, end_mask = var_3616_end_mask_0, x = var_3565_cast_fp16)[name = tensor<string, []>("op_3616_cast_fp16")];
            tensor<int32, [4]> var_3623_begin_0 = const()[name = tensor<string, []>("op_3623_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3623_end_0 = const()[name = tensor<string, []>("op_3623_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3623_end_mask_0 = const()[name = tensor<string, []>("op_3623_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3623_cast_fp16 = slice_by_index(begin = var_3623_begin_0, end = var_3623_end_0, end_mask = var_3623_end_mask_0, x = var_3565_cast_fp16)[name = tensor<string, []>("op_3623_cast_fp16")];
            tensor<int32, [4]> var_3630_begin_0 = const()[name = tensor<string, []>("op_3630_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3630_end_0 = const()[name = tensor<string, []>("op_3630_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3630_end_mask_0 = const()[name = tensor<string, []>("op_3630_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3630_cast_fp16 = slice_by_index(begin = var_3630_begin_0, end = var_3630_end_0, end_mask = var_3630_end_mask_0, x = var_3569_cast_fp16)[name = tensor<string, []>("op_3630_cast_fp16")];
            tensor<int32, [4]> var_3637_begin_0 = const()[name = tensor<string, []>("op_3637_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3637_end_0 = const()[name = tensor<string, []>("op_3637_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3637_end_mask_0 = const()[name = tensor<string, []>("op_3637_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3637_cast_fp16 = slice_by_index(begin = var_3637_begin_0, end = var_3637_end_0, end_mask = var_3637_end_mask_0, x = var_3569_cast_fp16)[name = tensor<string, []>("op_3637_cast_fp16")];
            tensor<int32, [4]> var_3644_begin_0 = const()[name = tensor<string, []>("op_3644_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3644_end_0 = const()[name = tensor<string, []>("op_3644_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3644_end_mask_0 = const()[name = tensor<string, []>("op_3644_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3644_cast_fp16 = slice_by_index(begin = var_3644_begin_0, end = var_3644_end_0, end_mask = var_3644_end_mask_0, x = var_3569_cast_fp16)[name = tensor<string, []>("op_3644_cast_fp16")];
            tensor<int32, [4]> var_3651_begin_0 = const()[name = tensor<string, []>("op_3651_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3651_end_0 = const()[name = tensor<string, []>("op_3651_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3651_end_mask_0 = const()[name = tensor<string, []>("op_3651_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3651_cast_fp16 = slice_by_index(begin = var_3651_begin_0, end = var_3651_end_0, end_mask = var_3651_end_mask_0, x = var_3569_cast_fp16)[name = tensor<string, []>("op_3651_cast_fp16")];
            tensor<int32, [4]> var_3658_begin_0 = const()[name = tensor<string, []>("op_3658_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3658_end_0 = const()[name = tensor<string, []>("op_3658_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3658_end_mask_0 = const()[name = tensor<string, []>("op_3658_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3658_cast_fp16 = slice_by_index(begin = var_3658_begin_0, end = var_3658_end_0, end_mask = var_3658_end_mask_0, x = var_3573_cast_fp16)[name = tensor<string, []>("op_3658_cast_fp16")];
            tensor<int32, [4]> var_3665_begin_0 = const()[name = tensor<string, []>("op_3665_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3665_end_0 = const()[name = tensor<string, []>("op_3665_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3665_end_mask_0 = const()[name = tensor<string, []>("op_3665_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3665_cast_fp16 = slice_by_index(begin = var_3665_begin_0, end = var_3665_end_0, end_mask = var_3665_end_mask_0, x = var_3573_cast_fp16)[name = tensor<string, []>("op_3665_cast_fp16")];
            tensor<int32, [4]> var_3672_begin_0 = const()[name = tensor<string, []>("op_3672_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3672_end_0 = const()[name = tensor<string, []>("op_3672_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3672_end_mask_0 = const()[name = tensor<string, []>("op_3672_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3672_cast_fp16 = slice_by_index(begin = var_3672_begin_0, end = var_3672_end_0, end_mask = var_3672_end_mask_0, x = var_3573_cast_fp16)[name = tensor<string, []>("op_3672_cast_fp16")];
            tensor<int32, [4]> var_3679_begin_0 = const()[name = tensor<string, []>("op_3679_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3679_end_0 = const()[name = tensor<string, []>("op_3679_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3679_end_mask_0 = const()[name = tensor<string, []>("op_3679_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3679_cast_fp16 = slice_by_index(begin = var_3679_begin_0, end = var_3679_end_0, end_mask = var_3679_end_mask_0, x = var_3573_cast_fp16)[name = tensor<string, []>("op_3679_cast_fp16")];
            tensor<int32, [4]> var_3686_begin_0 = const()[name = tensor<string, []>("op_3686_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3686_end_0 = const()[name = tensor<string, []>("op_3686_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3686_end_mask_0 = const()[name = tensor<string, []>("op_3686_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3686_cast_fp16 = slice_by_index(begin = var_3686_begin_0, end = var_3686_end_0, end_mask = var_3686_end_mask_0, x = var_3577_cast_fp16)[name = tensor<string, []>("op_3686_cast_fp16")];
            tensor<int32, [4]> var_3693_begin_0 = const()[name = tensor<string, []>("op_3693_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3693_end_0 = const()[name = tensor<string, []>("op_3693_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3693_end_mask_0 = const()[name = tensor<string, []>("op_3693_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3693_cast_fp16 = slice_by_index(begin = var_3693_begin_0, end = var_3693_end_0, end_mask = var_3693_end_mask_0, x = var_3577_cast_fp16)[name = tensor<string, []>("op_3693_cast_fp16")];
            tensor<int32, [4]> var_3700_begin_0 = const()[name = tensor<string, []>("op_3700_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3700_end_0 = const()[name = tensor<string, []>("op_3700_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3700_end_mask_0 = const()[name = tensor<string, []>("op_3700_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3700_cast_fp16 = slice_by_index(begin = var_3700_begin_0, end = var_3700_end_0, end_mask = var_3700_end_mask_0, x = var_3577_cast_fp16)[name = tensor<string, []>("op_3700_cast_fp16")];
            tensor<int32, [4]> var_3707_begin_0 = const()[name = tensor<string, []>("op_3707_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3707_end_0 = const()[name = tensor<string, []>("op_3707_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3707_end_mask_0 = const()[name = tensor<string, []>("op_3707_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3707_cast_fp16 = slice_by_index(begin = var_3707_begin_0, end = var_3707_end_0, end_mask = var_3707_end_mask_0, x = var_3577_cast_fp16)[name = tensor<string, []>("op_3707_cast_fp16")];
            tensor<int32, [4]> var_3714_begin_0 = const()[name = tensor<string, []>("op_3714_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3714_end_0 = const()[name = tensor<string, []>("op_3714_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3714_end_mask_0 = const()[name = tensor<string, []>("op_3714_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3714_cast_fp16 = slice_by_index(begin = var_3714_begin_0, end = var_3714_end_0, end_mask = var_3714_end_mask_0, x = var_3581_cast_fp16)[name = tensor<string, []>("op_3714_cast_fp16")];
            tensor<int32, [4]> var_3721_begin_0 = const()[name = tensor<string, []>("op_3721_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3721_end_0 = const()[name = tensor<string, []>("op_3721_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3721_end_mask_0 = const()[name = tensor<string, []>("op_3721_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3721_cast_fp16 = slice_by_index(begin = var_3721_begin_0, end = var_3721_end_0, end_mask = var_3721_end_mask_0, x = var_3581_cast_fp16)[name = tensor<string, []>("op_3721_cast_fp16")];
            tensor<int32, [4]> var_3728_begin_0 = const()[name = tensor<string, []>("op_3728_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3728_end_0 = const()[name = tensor<string, []>("op_3728_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3728_end_mask_0 = const()[name = tensor<string, []>("op_3728_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3728_cast_fp16 = slice_by_index(begin = var_3728_begin_0, end = var_3728_end_0, end_mask = var_3728_end_mask_0, x = var_3581_cast_fp16)[name = tensor<string, []>("op_3728_cast_fp16")];
            tensor<int32, [4]> var_3735_begin_0 = const()[name = tensor<string, []>("op_3735_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3735_end_0 = const()[name = tensor<string, []>("op_3735_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3735_end_mask_0 = const()[name = tensor<string, []>("op_3735_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3735_cast_fp16 = slice_by_index(begin = var_3735_begin_0, end = var_3735_end_0, end_mask = var_3735_end_mask_0, x = var_3581_cast_fp16)[name = tensor<string, []>("op_3735_cast_fp16")];
            tensor<int32, [4]> var_3742_begin_0 = const()[name = tensor<string, []>("op_3742_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3742_end_0 = const()[name = tensor<string, []>("op_3742_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3742_end_mask_0 = const()[name = tensor<string, []>("op_3742_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3742_cast_fp16 = slice_by_index(begin = var_3742_begin_0, end = var_3742_end_0, end_mask = var_3742_end_mask_0, x = var_3585_cast_fp16)[name = tensor<string, []>("op_3742_cast_fp16")];
            tensor<int32, [4]> var_3749_begin_0 = const()[name = tensor<string, []>("op_3749_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3749_end_0 = const()[name = tensor<string, []>("op_3749_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3749_end_mask_0 = const()[name = tensor<string, []>("op_3749_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3749_cast_fp16 = slice_by_index(begin = var_3749_begin_0, end = var_3749_end_0, end_mask = var_3749_end_mask_0, x = var_3585_cast_fp16)[name = tensor<string, []>("op_3749_cast_fp16")];
            tensor<int32, [4]> var_3756_begin_0 = const()[name = tensor<string, []>("op_3756_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3756_end_0 = const()[name = tensor<string, []>("op_3756_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3756_end_mask_0 = const()[name = tensor<string, []>("op_3756_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3756_cast_fp16 = slice_by_index(begin = var_3756_begin_0, end = var_3756_end_0, end_mask = var_3756_end_mask_0, x = var_3585_cast_fp16)[name = tensor<string, []>("op_3756_cast_fp16")];
            tensor<int32, [4]> var_3763_begin_0 = const()[name = tensor<string, []>("op_3763_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3763_end_0 = const()[name = tensor<string, []>("op_3763_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3763_end_mask_0 = const()[name = tensor<string, []>("op_3763_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3763_cast_fp16 = slice_by_index(begin = var_3763_begin_0, end = var_3763_end_0, end_mask = var_3763_end_mask_0, x = var_3585_cast_fp16)[name = tensor<string, []>("op_3763_cast_fp16")];
            tensor<int32, [4]> var_3770_begin_0 = const()[name = tensor<string, []>("op_3770_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3770_end_0 = const()[name = tensor<string, []>("op_3770_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3770_end_mask_0 = const()[name = tensor<string, []>("op_3770_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3770_cast_fp16 = slice_by_index(begin = var_3770_begin_0, end = var_3770_end_0, end_mask = var_3770_end_mask_0, x = var_3589_cast_fp16)[name = tensor<string, []>("op_3770_cast_fp16")];
            tensor<int32, [4]> var_3777_begin_0 = const()[name = tensor<string, []>("op_3777_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3777_end_0 = const()[name = tensor<string, []>("op_3777_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3777_end_mask_0 = const()[name = tensor<string, []>("op_3777_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3777_cast_fp16 = slice_by_index(begin = var_3777_begin_0, end = var_3777_end_0, end_mask = var_3777_end_mask_0, x = var_3589_cast_fp16)[name = tensor<string, []>("op_3777_cast_fp16")];
            tensor<int32, [4]> var_3784_begin_0 = const()[name = tensor<string, []>("op_3784_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3784_end_0 = const()[name = tensor<string, []>("op_3784_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3784_end_mask_0 = const()[name = tensor<string, []>("op_3784_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3784_cast_fp16 = slice_by_index(begin = var_3784_begin_0, end = var_3784_end_0, end_mask = var_3784_end_mask_0, x = var_3589_cast_fp16)[name = tensor<string, []>("op_3784_cast_fp16")];
            tensor<int32, [4]> var_3791_begin_0 = const()[name = tensor<string, []>("op_3791_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3791_end_0 = const()[name = tensor<string, []>("op_3791_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3791_end_mask_0 = const()[name = tensor<string, []>("op_3791_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3791_cast_fp16 = slice_by_index(begin = var_3791_begin_0, end = var_3791_end_0, end_mask = var_3791_end_mask_0, x = var_3589_cast_fp16)[name = tensor<string, []>("op_3791_cast_fp16")];
            tensor<int32, [4]> var_3798_begin_0 = const()[name = tensor<string, []>("op_3798_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3798_end_0 = const()[name = tensor<string, []>("op_3798_end_0"), val = tensor<int32, [4]>([1, 64, 1, 375])];
            tensor<bool, [4]> var_3798_end_mask_0 = const()[name = tensor<string, []>("op_3798_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3798_cast_fp16 = slice_by_index(begin = var_3798_begin_0, end = var_3798_end_0, end_mask = var_3798_end_mask_0, x = var_3593_cast_fp16)[name = tensor<string, []>("op_3798_cast_fp16")];
            tensor<int32, [4]> var_3805_begin_0 = const()[name = tensor<string, []>("op_3805_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 375])];
            tensor<int32, [4]> var_3805_end_0 = const()[name = tensor<string, []>("op_3805_end_0"), val = tensor<int32, [4]>([1, 64, 1, 750])];
            tensor<bool, [4]> var_3805_end_mask_0 = const()[name = tensor<string, []>("op_3805_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3805_cast_fp16 = slice_by_index(begin = var_3805_begin_0, end = var_3805_end_0, end_mask = var_3805_end_mask_0, x = var_3593_cast_fp16)[name = tensor<string, []>("op_3805_cast_fp16")];
            tensor<int32, [4]> var_3812_begin_0 = const()[name = tensor<string, []>("op_3812_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 750])];
            tensor<int32, [4]> var_3812_end_0 = const()[name = tensor<string, []>("op_3812_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1125])];
            tensor<bool, [4]> var_3812_end_mask_0 = const()[name = tensor<string, []>("op_3812_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3812_cast_fp16 = slice_by_index(begin = var_3812_begin_0, end = var_3812_end_0, end_mask = var_3812_end_mask_0, x = var_3593_cast_fp16)[name = tensor<string, []>("op_3812_cast_fp16")];
            tensor<int32, [4]> var_3819_begin_0 = const()[name = tensor<string, []>("op_3819_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 1125])];
            tensor<int32, [4]> var_3819_end_0 = const()[name = tensor<string, []>("op_3819_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3819_end_mask_0 = const()[name = tensor<string, []>("op_3819_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 64, 1, 375]> var_3819_cast_fp16 = slice_by_index(begin = var_3819_begin_0, end = var_3819_end_0, end_mask = var_3819_end_mask_0, x = var_3593_cast_fp16)[name = tensor<string, []>("op_3819_cast_fp16")];
            tensor<int32, [4]> k_perm_0 = const()[name = tensor<string, []>("k_perm_0"), val = tensor<int32, [4]>([0, 3, 2, 1])];
            tensor<int32, [4]> var_3824_begin_0 = const()[name = tensor<string, []>("op_3824_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3824_end_0 = const()[name = tensor<string, []>("op_3824_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 64])];
            tensor<bool, [4]> var_3824_end_mask_0 = const()[name = tensor<string, []>("op_3824_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 512]> transpose_0 = transpose(perm = k_perm_0, x = key_cast_fp16)[name = tensor<string, []>("transpose_0")];
            tensor<fp16, [1, 1500, 1, 64]> var_3824_cast_fp16 = slice_by_index(begin = var_3824_begin_0, end = var_3824_end_0, end_mask = var_3824_end_mask_0, x = transpose_0)[name = tensor<string, []>("op_3824_cast_fp16")];
            tensor<int32, [4]> var_3828_begin_0 = const()[name = tensor<string, []>("op_3828_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 64])];
            tensor<int32, [4]> var_3828_end_0 = const()[name = tensor<string, []>("op_3828_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 128])];
            tensor<bool, [4]> var_3828_end_mask_0 = const()[name = tensor<string, []>("op_3828_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3828_cast_fp16 = slice_by_index(begin = var_3828_begin_0, end = var_3828_end_0, end_mask = var_3828_end_mask_0, x = transpose_0)[name = tensor<string, []>("op_3828_cast_fp16")];
            tensor<int32, [4]> var_3832_begin_0 = const()[name = tensor<string, []>("op_3832_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 128])];
            tensor<int32, [4]> var_3832_end_0 = const()[name = tensor<string, []>("op_3832_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 192])];
            tensor<bool, [4]> var_3832_end_mask_0 = const()[name = tensor<string, []>("op_3832_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3832_cast_fp16 = slice_by_index(begin = var_3832_begin_0, end = var_3832_end_0, end_mask = var_3832_end_mask_0, x = transpose_0)[name = tensor<string, []>("op_3832_cast_fp16")];
            tensor<int32, [4]> var_3836_begin_0 = const()[name = tensor<string, []>("op_3836_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 192])];
            tensor<int32, [4]> var_3836_end_0 = const()[name = tensor<string, []>("op_3836_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 256])];
            tensor<bool, [4]> var_3836_end_mask_0 = const()[name = tensor<string, []>("op_3836_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3836_cast_fp16 = slice_by_index(begin = var_3836_begin_0, end = var_3836_end_0, end_mask = var_3836_end_mask_0, x = transpose_0)[name = tensor<string, []>("op_3836_cast_fp16")];
            tensor<int32, [4]> var_3840_begin_0 = const()[name = tensor<string, []>("op_3840_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 256])];
            tensor<int32, [4]> var_3840_end_0 = const()[name = tensor<string, []>("op_3840_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 320])];
            tensor<bool, [4]> var_3840_end_mask_0 = const()[name = tensor<string, []>("op_3840_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3840_cast_fp16 = slice_by_index(begin = var_3840_begin_0, end = var_3840_end_0, end_mask = var_3840_end_mask_0, x = transpose_0)[name = tensor<string, []>("op_3840_cast_fp16")];
            tensor<int32, [4]> var_3844_begin_0 = const()[name = tensor<string, []>("op_3844_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 320])];
            tensor<int32, [4]> var_3844_end_0 = const()[name = tensor<string, []>("op_3844_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 384])];
            tensor<bool, [4]> var_3844_end_mask_0 = const()[name = tensor<string, []>("op_3844_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3844_cast_fp16 = slice_by_index(begin = var_3844_begin_0, end = var_3844_end_0, end_mask = var_3844_end_mask_0, x = transpose_0)[name = tensor<string, []>("op_3844_cast_fp16")];
            tensor<int32, [4]> var_3848_begin_0 = const()[name = tensor<string, []>("op_3848_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 384])];
            tensor<int32, [4]> var_3848_end_0 = const()[name = tensor<string, []>("op_3848_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 448])];
            tensor<bool, [4]> var_3848_end_mask_0 = const()[name = tensor<string, []>("op_3848_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3848_cast_fp16 = slice_by_index(begin = var_3848_begin_0, end = var_3848_end_0, end_mask = var_3848_end_mask_0, x = transpose_0)[name = tensor<string, []>("op_3848_cast_fp16")];
            tensor<int32, [4]> var_3852_begin_0 = const()[name = tensor<string, []>("op_3852_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 448])];
            tensor<int32, [4]> var_3852_end_0 = const()[name = tensor<string, []>("op_3852_end_0"), val = tensor<int32, [4]>([1, 1500, 1, 512])];
            tensor<bool, [4]> var_3852_end_mask_0 = const()[name = tensor<string, []>("op_3852_end_mask_0"), val = tensor<bool, [4]>([true, true, true, false])];
            tensor<fp16, [1, 1500, 1, 64]> var_3852_cast_fp16 = slice_by_index(begin = var_3852_begin_0, end = var_3852_end_0, end_mask = var_3852_end_mask_0, x = transpose_0)[name = tensor<string, []>("op_3852_cast_fp16")];
            tensor<int32, [4]> var_3854_begin_0 = const()[name = tensor<string, []>("op_3854_begin_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<int32, [4]> var_3854_end_0 = const()[name = tensor<string, []>("op_3854_end_0"), val = tensor<int32, [4]>([1, 64, 1, 1500])];
            tensor<bool, [4]> var_3854_end_mask_0 = const()[name = tensor<string, []>("op_3854_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3854_cast_fp16 = slice_by_index(begin = var_3854_begin_0, end = var_3854_end_0, end_mask = var_3854_end_mask_0, x = value_cast_fp16)[name = tensor<string, []>("op_3854_cast_fp16")];
            tensor<int32, [4]> var_3858_begin_0 = const()[name = tensor<string, []>("op_3858_begin_0"), val = tensor<int32, [4]>([0, 64, 0, 0])];
            tensor<int32, [4]> var_3858_end_0 = const()[name = tensor<string, []>("op_3858_end_0"), val = tensor<int32, [4]>([1, 128, 1, 1500])];
            tensor<bool, [4]> var_3858_end_mask_0 = const()[name = tensor<string, []>("op_3858_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3858_cast_fp16 = slice_by_index(begin = var_3858_begin_0, end = var_3858_end_0, end_mask = var_3858_end_mask_0, x = value_cast_fp16)[name = tensor<string, []>("op_3858_cast_fp16")];
            tensor<int32, [4]> var_3862_begin_0 = const()[name = tensor<string, []>("op_3862_begin_0"), val = tensor<int32, [4]>([0, 128, 0, 0])];
            tensor<int32, [4]> var_3862_end_0 = const()[name = tensor<string, []>("op_3862_end_0"), val = tensor<int32, [4]>([1, 192, 1, 1500])];
            tensor<bool, [4]> var_3862_end_mask_0 = const()[name = tensor<string, []>("op_3862_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3862_cast_fp16 = slice_by_index(begin = var_3862_begin_0, end = var_3862_end_0, end_mask = var_3862_end_mask_0, x = value_cast_fp16)[name = tensor<string, []>("op_3862_cast_fp16")];
            tensor<int32, [4]> var_3866_begin_0 = const()[name = tensor<string, []>("op_3866_begin_0"), val = tensor<int32, [4]>([0, 192, 0, 0])];
            tensor<int32, [4]> var_3866_end_0 = const()[name = tensor<string, []>("op_3866_end_0"), val = tensor<int32, [4]>([1, 256, 1, 1500])];
            tensor<bool, [4]> var_3866_end_mask_0 = const()[name = tensor<string, []>("op_3866_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3866_cast_fp16 = slice_by_index(begin = var_3866_begin_0, end = var_3866_end_0, end_mask = var_3866_end_mask_0, x = value_cast_fp16)[name = tensor<string, []>("op_3866_cast_fp16")];
            tensor<int32, [4]> var_3870_begin_0 = const()[name = tensor<string, []>("op_3870_begin_0"), val = tensor<int32, [4]>([0, 256, 0, 0])];
            tensor<int32, [4]> var_3870_end_0 = const()[name = tensor<string, []>("op_3870_end_0"), val = tensor<int32, [4]>([1, 320, 1, 1500])];
            tensor<bool, [4]> var_3870_end_mask_0 = const()[name = tensor<string, []>("op_3870_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3870_cast_fp16 = slice_by_index(begin = var_3870_begin_0, end = var_3870_end_0, end_mask = var_3870_end_mask_0, x = value_cast_fp16)[name = tensor<string, []>("op_3870_cast_fp16")];
            tensor<int32, [4]> var_3874_begin_0 = const()[name = tensor<string, []>("op_3874_begin_0"), val = tensor<int32, [4]>([0, 320, 0, 0])];
            tensor<int32, [4]> var_3874_end_0 = const()[name = tensor<string, []>("op_3874_end_0"), val = tensor<int32, [4]>([1, 384, 1, 1500])];
            tensor<bool, [4]> var_3874_end_mask_0 = const()[name = tensor<string, []>("op_3874_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3874_cast_fp16 = slice_by_index(begin = var_3874_begin_0, end = var_3874_end_0, end_mask = var_3874_end_mask_0, x = value_cast_fp16)[name = tensor<string, []>("op_3874_cast_fp16")];
            tensor<int32, [4]> var_3878_begin_0 = const()[name = tensor<string, []>("op_3878_begin_0"), val = tensor<int32, [4]>([0, 384, 0, 0])];
            tensor<int32, [4]> var_3878_end_0 = const()[name = tensor<string, []>("op_3878_end_0"), val = tensor<int32, [4]>([1, 448, 1, 1500])];
            tensor<bool, [4]> var_3878_end_mask_0 = const()[name = tensor<string, []>("op_3878_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3878_cast_fp16 = slice_by_index(begin = var_3878_begin_0, end = var_3878_end_0, end_mask = var_3878_end_mask_0, x = value_cast_fp16)[name = tensor<string, []>("op_3878_cast_fp16")];
            tensor<int32, [4]> var_3882_begin_0 = const()[name = tensor<string, []>("op_3882_begin_0"), val = tensor<int32, [4]>([0, 448, 0, 0])];
            tensor<int32, [4]> var_3882_end_0 = const()[name = tensor<string, []>("op_3882_end_0"), val = tensor<int32, [4]>([1, 512, 1, 1500])];
            tensor<bool, [4]> var_3882_end_mask_0 = const()[name = tensor<string, []>("op_3882_end_mask_0"), val = tensor<bool, [4]>([true, false, true, true])];
            tensor<fp16, [1, 64, 1, 1500]> var_3882_cast_fp16 = slice_by_index(begin = var_3882_begin_0, end = var_3882_end_0, end_mask = var_3882_end_mask_0, x = value_cast_fp16)[name = tensor<string, []>("op_3882_cast_fp16")];
            tensor<string, []> var_3886_equation_0 = const()[name = tensor<string, []>("op_3886_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3886_cast_fp16 = einsum(equation = var_3886_equation_0, values = (var_3824_cast_fp16, var_3602_cast_fp16))[name = tensor<string, []>("op_3886_cast_fp16")];
            tensor<fp16, []> var_3887_to_fp16 = const()[name = tensor<string, []>("op_3887_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_321_cast_fp16 = mul(x = var_3886_cast_fp16, y = var_3887_to_fp16)[name = tensor<string, []>("aw_chunk_321_cast_fp16")];
            tensor<string, []> var_3890_equation_0 = const()[name = tensor<string, []>("op_3890_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3890_cast_fp16 = einsum(equation = var_3890_equation_0, values = (var_3824_cast_fp16, var_3609_cast_fp16))[name = tensor<string, []>("op_3890_cast_fp16")];
            tensor<fp16, []> var_3891_to_fp16 = const()[name = tensor<string, []>("op_3891_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_323_cast_fp16 = mul(x = var_3890_cast_fp16, y = var_3891_to_fp16)[name = tensor<string, []>("aw_chunk_323_cast_fp16")];
            tensor<string, []> var_3894_equation_0 = const()[name = tensor<string, []>("op_3894_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3894_cast_fp16 = einsum(equation = var_3894_equation_0, values = (var_3824_cast_fp16, var_3616_cast_fp16))[name = tensor<string, []>("op_3894_cast_fp16")];
            tensor<fp16, []> var_3895_to_fp16 = const()[name = tensor<string, []>("op_3895_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_325_cast_fp16 = mul(x = var_3894_cast_fp16, y = var_3895_to_fp16)[name = tensor<string, []>("aw_chunk_325_cast_fp16")];
            tensor<string, []> var_3898_equation_0 = const()[name = tensor<string, []>("op_3898_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3898_cast_fp16 = einsum(equation = var_3898_equation_0, values = (var_3824_cast_fp16, var_3623_cast_fp16))[name = tensor<string, []>("op_3898_cast_fp16")];
            tensor<fp16, []> var_3899_to_fp16 = const()[name = tensor<string, []>("op_3899_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_327_cast_fp16 = mul(x = var_3898_cast_fp16, y = var_3899_to_fp16)[name = tensor<string, []>("aw_chunk_327_cast_fp16")];
            tensor<string, []> var_3902_equation_0 = const()[name = tensor<string, []>("op_3902_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3902_cast_fp16 = einsum(equation = var_3902_equation_0, values = (var_3828_cast_fp16, var_3630_cast_fp16))[name = tensor<string, []>("op_3902_cast_fp16")];
            tensor<fp16, []> var_3903_to_fp16 = const()[name = tensor<string, []>("op_3903_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_329_cast_fp16 = mul(x = var_3902_cast_fp16, y = var_3903_to_fp16)[name = tensor<string, []>("aw_chunk_329_cast_fp16")];
            tensor<string, []> var_3906_equation_0 = const()[name = tensor<string, []>("op_3906_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3906_cast_fp16 = einsum(equation = var_3906_equation_0, values = (var_3828_cast_fp16, var_3637_cast_fp16))[name = tensor<string, []>("op_3906_cast_fp16")];
            tensor<fp16, []> var_3907_to_fp16 = const()[name = tensor<string, []>("op_3907_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_331_cast_fp16 = mul(x = var_3906_cast_fp16, y = var_3907_to_fp16)[name = tensor<string, []>("aw_chunk_331_cast_fp16")];
            tensor<string, []> var_3910_equation_0 = const()[name = tensor<string, []>("op_3910_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3910_cast_fp16 = einsum(equation = var_3910_equation_0, values = (var_3828_cast_fp16, var_3644_cast_fp16))[name = tensor<string, []>("op_3910_cast_fp16")];
            tensor<fp16, []> var_3911_to_fp16 = const()[name = tensor<string, []>("op_3911_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_333_cast_fp16 = mul(x = var_3910_cast_fp16, y = var_3911_to_fp16)[name = tensor<string, []>("aw_chunk_333_cast_fp16")];
            tensor<string, []> var_3914_equation_0 = const()[name = tensor<string, []>("op_3914_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3914_cast_fp16 = einsum(equation = var_3914_equation_0, values = (var_3828_cast_fp16, var_3651_cast_fp16))[name = tensor<string, []>("op_3914_cast_fp16")];
            tensor<fp16, []> var_3915_to_fp16 = const()[name = tensor<string, []>("op_3915_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_335_cast_fp16 = mul(x = var_3914_cast_fp16, y = var_3915_to_fp16)[name = tensor<string, []>("aw_chunk_335_cast_fp16")];
            tensor<string, []> var_3918_equation_0 = const()[name = tensor<string, []>("op_3918_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3918_cast_fp16 = einsum(equation = var_3918_equation_0, values = (var_3832_cast_fp16, var_3658_cast_fp16))[name = tensor<string, []>("op_3918_cast_fp16")];
            tensor<fp16, []> var_3919_to_fp16 = const()[name = tensor<string, []>("op_3919_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_337_cast_fp16 = mul(x = var_3918_cast_fp16, y = var_3919_to_fp16)[name = tensor<string, []>("aw_chunk_337_cast_fp16")];
            tensor<string, []> var_3922_equation_0 = const()[name = tensor<string, []>("op_3922_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3922_cast_fp16 = einsum(equation = var_3922_equation_0, values = (var_3832_cast_fp16, var_3665_cast_fp16))[name = tensor<string, []>("op_3922_cast_fp16")];
            tensor<fp16, []> var_3923_to_fp16 = const()[name = tensor<string, []>("op_3923_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_339_cast_fp16 = mul(x = var_3922_cast_fp16, y = var_3923_to_fp16)[name = tensor<string, []>("aw_chunk_339_cast_fp16")];
            tensor<string, []> var_3926_equation_0 = const()[name = tensor<string, []>("op_3926_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3926_cast_fp16 = einsum(equation = var_3926_equation_0, values = (var_3832_cast_fp16, var_3672_cast_fp16))[name = tensor<string, []>("op_3926_cast_fp16")];
            tensor<fp16, []> var_3927_to_fp16 = const()[name = tensor<string, []>("op_3927_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_341_cast_fp16 = mul(x = var_3926_cast_fp16, y = var_3927_to_fp16)[name = tensor<string, []>("aw_chunk_341_cast_fp16")];
            tensor<string, []> var_3930_equation_0 = const()[name = tensor<string, []>("op_3930_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3930_cast_fp16 = einsum(equation = var_3930_equation_0, values = (var_3832_cast_fp16, var_3679_cast_fp16))[name = tensor<string, []>("op_3930_cast_fp16")];
            tensor<fp16, []> var_3931_to_fp16 = const()[name = tensor<string, []>("op_3931_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_343_cast_fp16 = mul(x = var_3930_cast_fp16, y = var_3931_to_fp16)[name = tensor<string, []>("aw_chunk_343_cast_fp16")];
            tensor<string, []> var_3934_equation_0 = const()[name = tensor<string, []>("op_3934_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3934_cast_fp16 = einsum(equation = var_3934_equation_0, values = (var_3836_cast_fp16, var_3686_cast_fp16))[name = tensor<string, []>("op_3934_cast_fp16")];
            tensor<fp16, []> var_3935_to_fp16 = const()[name = tensor<string, []>("op_3935_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_345_cast_fp16 = mul(x = var_3934_cast_fp16, y = var_3935_to_fp16)[name = tensor<string, []>("aw_chunk_345_cast_fp16")];
            tensor<string, []> var_3938_equation_0 = const()[name = tensor<string, []>("op_3938_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3938_cast_fp16 = einsum(equation = var_3938_equation_0, values = (var_3836_cast_fp16, var_3693_cast_fp16))[name = tensor<string, []>("op_3938_cast_fp16")];
            tensor<fp16, []> var_3939_to_fp16 = const()[name = tensor<string, []>("op_3939_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_347_cast_fp16 = mul(x = var_3938_cast_fp16, y = var_3939_to_fp16)[name = tensor<string, []>("aw_chunk_347_cast_fp16")];
            tensor<string, []> var_3942_equation_0 = const()[name = tensor<string, []>("op_3942_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3942_cast_fp16 = einsum(equation = var_3942_equation_0, values = (var_3836_cast_fp16, var_3700_cast_fp16))[name = tensor<string, []>("op_3942_cast_fp16")];
            tensor<fp16, []> var_3943_to_fp16 = const()[name = tensor<string, []>("op_3943_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_349_cast_fp16 = mul(x = var_3942_cast_fp16, y = var_3943_to_fp16)[name = tensor<string, []>("aw_chunk_349_cast_fp16")];
            tensor<string, []> var_3946_equation_0 = const()[name = tensor<string, []>("op_3946_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3946_cast_fp16 = einsum(equation = var_3946_equation_0, values = (var_3836_cast_fp16, var_3707_cast_fp16))[name = tensor<string, []>("op_3946_cast_fp16")];
            tensor<fp16, []> var_3947_to_fp16 = const()[name = tensor<string, []>("op_3947_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_351_cast_fp16 = mul(x = var_3946_cast_fp16, y = var_3947_to_fp16)[name = tensor<string, []>("aw_chunk_351_cast_fp16")];
            tensor<string, []> var_3950_equation_0 = const()[name = tensor<string, []>("op_3950_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3950_cast_fp16 = einsum(equation = var_3950_equation_0, values = (var_3840_cast_fp16, var_3714_cast_fp16))[name = tensor<string, []>("op_3950_cast_fp16")];
            tensor<fp16, []> var_3951_to_fp16 = const()[name = tensor<string, []>("op_3951_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_353_cast_fp16 = mul(x = var_3950_cast_fp16, y = var_3951_to_fp16)[name = tensor<string, []>("aw_chunk_353_cast_fp16")];
            tensor<string, []> var_3954_equation_0 = const()[name = tensor<string, []>("op_3954_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3954_cast_fp16 = einsum(equation = var_3954_equation_0, values = (var_3840_cast_fp16, var_3721_cast_fp16))[name = tensor<string, []>("op_3954_cast_fp16")];
            tensor<fp16, []> var_3955_to_fp16 = const()[name = tensor<string, []>("op_3955_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_355_cast_fp16 = mul(x = var_3954_cast_fp16, y = var_3955_to_fp16)[name = tensor<string, []>("aw_chunk_355_cast_fp16")];
            tensor<string, []> var_3958_equation_0 = const()[name = tensor<string, []>("op_3958_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3958_cast_fp16 = einsum(equation = var_3958_equation_0, values = (var_3840_cast_fp16, var_3728_cast_fp16))[name = tensor<string, []>("op_3958_cast_fp16")];
            tensor<fp16, []> var_3959_to_fp16 = const()[name = tensor<string, []>("op_3959_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_357_cast_fp16 = mul(x = var_3958_cast_fp16, y = var_3959_to_fp16)[name = tensor<string, []>("aw_chunk_357_cast_fp16")];
            tensor<string, []> var_3962_equation_0 = const()[name = tensor<string, []>("op_3962_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3962_cast_fp16 = einsum(equation = var_3962_equation_0, values = (var_3840_cast_fp16, var_3735_cast_fp16))[name = tensor<string, []>("op_3962_cast_fp16")];
            tensor<fp16, []> var_3963_to_fp16 = const()[name = tensor<string, []>("op_3963_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_359_cast_fp16 = mul(x = var_3962_cast_fp16, y = var_3963_to_fp16)[name = tensor<string, []>("aw_chunk_359_cast_fp16")];
            tensor<string, []> var_3966_equation_0 = const()[name = tensor<string, []>("op_3966_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3966_cast_fp16 = einsum(equation = var_3966_equation_0, values = (var_3844_cast_fp16, var_3742_cast_fp16))[name = tensor<string, []>("op_3966_cast_fp16")];
            tensor<fp16, []> var_3967_to_fp16 = const()[name = tensor<string, []>("op_3967_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_361_cast_fp16 = mul(x = var_3966_cast_fp16, y = var_3967_to_fp16)[name = tensor<string, []>("aw_chunk_361_cast_fp16")];
            tensor<string, []> var_3970_equation_0 = const()[name = tensor<string, []>("op_3970_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3970_cast_fp16 = einsum(equation = var_3970_equation_0, values = (var_3844_cast_fp16, var_3749_cast_fp16))[name = tensor<string, []>("op_3970_cast_fp16")];
            tensor<fp16, []> var_3971_to_fp16 = const()[name = tensor<string, []>("op_3971_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_363_cast_fp16 = mul(x = var_3970_cast_fp16, y = var_3971_to_fp16)[name = tensor<string, []>("aw_chunk_363_cast_fp16")];
            tensor<string, []> var_3974_equation_0 = const()[name = tensor<string, []>("op_3974_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3974_cast_fp16 = einsum(equation = var_3974_equation_0, values = (var_3844_cast_fp16, var_3756_cast_fp16))[name = tensor<string, []>("op_3974_cast_fp16")];
            tensor<fp16, []> var_3975_to_fp16 = const()[name = tensor<string, []>("op_3975_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_365_cast_fp16 = mul(x = var_3974_cast_fp16, y = var_3975_to_fp16)[name = tensor<string, []>("aw_chunk_365_cast_fp16")];
            tensor<string, []> var_3978_equation_0 = const()[name = tensor<string, []>("op_3978_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3978_cast_fp16 = einsum(equation = var_3978_equation_0, values = (var_3844_cast_fp16, var_3763_cast_fp16))[name = tensor<string, []>("op_3978_cast_fp16")];
            tensor<fp16, []> var_3979_to_fp16 = const()[name = tensor<string, []>("op_3979_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_367_cast_fp16 = mul(x = var_3978_cast_fp16, y = var_3979_to_fp16)[name = tensor<string, []>("aw_chunk_367_cast_fp16")];
            tensor<string, []> var_3982_equation_0 = const()[name = tensor<string, []>("op_3982_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3982_cast_fp16 = einsum(equation = var_3982_equation_0, values = (var_3848_cast_fp16, var_3770_cast_fp16))[name = tensor<string, []>("op_3982_cast_fp16")];
            tensor<fp16, []> var_3983_to_fp16 = const()[name = tensor<string, []>("op_3983_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_369_cast_fp16 = mul(x = var_3982_cast_fp16, y = var_3983_to_fp16)[name = tensor<string, []>("aw_chunk_369_cast_fp16")];
            tensor<string, []> var_3986_equation_0 = const()[name = tensor<string, []>("op_3986_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3986_cast_fp16 = einsum(equation = var_3986_equation_0, values = (var_3848_cast_fp16, var_3777_cast_fp16))[name = tensor<string, []>("op_3986_cast_fp16")];
            tensor<fp16, []> var_3987_to_fp16 = const()[name = tensor<string, []>("op_3987_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_371_cast_fp16 = mul(x = var_3986_cast_fp16, y = var_3987_to_fp16)[name = tensor<string, []>("aw_chunk_371_cast_fp16")];
            tensor<string, []> var_3990_equation_0 = const()[name = tensor<string, []>("op_3990_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3990_cast_fp16 = einsum(equation = var_3990_equation_0, values = (var_3848_cast_fp16, var_3784_cast_fp16))[name = tensor<string, []>("op_3990_cast_fp16")];
            tensor<fp16, []> var_3991_to_fp16 = const()[name = tensor<string, []>("op_3991_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_373_cast_fp16 = mul(x = var_3990_cast_fp16, y = var_3991_to_fp16)[name = tensor<string, []>("aw_chunk_373_cast_fp16")];
            tensor<string, []> var_3994_equation_0 = const()[name = tensor<string, []>("op_3994_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3994_cast_fp16 = einsum(equation = var_3994_equation_0, values = (var_3848_cast_fp16, var_3791_cast_fp16))[name = tensor<string, []>("op_3994_cast_fp16")];
            tensor<fp16, []> var_3995_to_fp16 = const()[name = tensor<string, []>("op_3995_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_375_cast_fp16 = mul(x = var_3994_cast_fp16, y = var_3995_to_fp16)[name = tensor<string, []>("aw_chunk_375_cast_fp16")];
            tensor<string, []> var_3998_equation_0 = const()[name = tensor<string, []>("op_3998_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_3998_cast_fp16 = einsum(equation = var_3998_equation_0, values = (var_3852_cast_fp16, var_3798_cast_fp16))[name = tensor<string, []>("op_3998_cast_fp16")];
            tensor<fp16, []> var_3999_to_fp16 = const()[name = tensor<string, []>("op_3999_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_377_cast_fp16 = mul(x = var_3998_cast_fp16, y = var_3999_to_fp16)[name = tensor<string, []>("aw_chunk_377_cast_fp16")];
            tensor<string, []> var_4002_equation_0 = const()[name = tensor<string, []>("op_4002_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_4002_cast_fp16 = einsum(equation = var_4002_equation_0, values = (var_3852_cast_fp16, var_3805_cast_fp16))[name = tensor<string, []>("op_4002_cast_fp16")];
            tensor<fp16, []> var_4003_to_fp16 = const()[name = tensor<string, []>("op_4003_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_379_cast_fp16 = mul(x = var_4002_cast_fp16, y = var_4003_to_fp16)[name = tensor<string, []>("aw_chunk_379_cast_fp16")];
            tensor<string, []> var_4006_equation_0 = const()[name = tensor<string, []>("op_4006_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_4006_cast_fp16 = einsum(equation = var_4006_equation_0, values = (var_3852_cast_fp16, var_3812_cast_fp16))[name = tensor<string, []>("op_4006_cast_fp16")];
            tensor<fp16, []> var_4007_to_fp16 = const()[name = tensor<string, []>("op_4007_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_381_cast_fp16 = mul(x = var_4006_cast_fp16, y = var_4007_to_fp16)[name = tensor<string, []>("aw_chunk_381_cast_fp16")];
            tensor<string, []> var_4010_equation_0 = const()[name = tensor<string, []>("op_4010_equation_0"), val = tensor<string, []>("bkhc,bchq->bkhq")];
            tensor<fp16, [1, 1500, 1, 375]> var_4010_cast_fp16 = einsum(equation = var_4010_equation_0, values = (var_3852_cast_fp16, var_3819_cast_fp16))[name = tensor<string, []>("op_4010_cast_fp16")];
            tensor<fp16, []> var_4011_to_fp16 = const()[name = tensor<string, []>("op_4011_to_fp16"), val = tensor<fp16, []>(0x1p-3)];
            tensor<fp16, [1, 1500, 1, 375]> aw_chunk_cast_fp16 = mul(x = var_4010_cast_fp16, y = var_4011_to_fp16)[name = tensor<string, []>("aw_chunk_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4013_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_321_cast_fp16)[name = tensor<string, []>("op_4013_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4014_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_323_cast_fp16)[name = tensor<string, []>("op_4014_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4015_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_325_cast_fp16)[name = tensor<string, []>("op_4015_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4016_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_327_cast_fp16)[name = tensor<string, []>("op_4016_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4017_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_329_cast_fp16)[name = tensor<string, []>("op_4017_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4018_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_331_cast_fp16)[name = tensor<string, []>("op_4018_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4019_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_333_cast_fp16)[name = tensor<string, []>("op_4019_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4020_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_335_cast_fp16)[name = tensor<string, []>("op_4020_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4021_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_337_cast_fp16)[name = tensor<string, []>("op_4021_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4022_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_339_cast_fp16)[name = tensor<string, []>("op_4022_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4023_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_341_cast_fp16)[name = tensor<string, []>("op_4023_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4024_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_343_cast_fp16)[name = tensor<string, []>("op_4024_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4025_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_345_cast_fp16)[name = tensor<string, []>("op_4025_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4026_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_347_cast_fp16)[name = tensor<string, []>("op_4026_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4027_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_349_cast_fp16)[name = tensor<string, []>("op_4027_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4028_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_351_cast_fp16)[name = tensor<string, []>("op_4028_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4029_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_353_cast_fp16)[name = tensor<string, []>("op_4029_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4030_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_355_cast_fp16)[name = tensor<string, []>("op_4030_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4031_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_357_cast_fp16)[name = tensor<string, []>("op_4031_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4032_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_359_cast_fp16)[name = tensor<string, []>("op_4032_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4033_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_361_cast_fp16)[name = tensor<string, []>("op_4033_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4034_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_363_cast_fp16)[name = tensor<string, []>("op_4034_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4035_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_365_cast_fp16)[name = tensor<string, []>("op_4035_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4036_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_367_cast_fp16)[name = tensor<string, []>("op_4036_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4037_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_369_cast_fp16)[name = tensor<string, []>("op_4037_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4038_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_371_cast_fp16)[name = tensor<string, []>("op_4038_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4039_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_373_cast_fp16)[name = tensor<string, []>("op_4039_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4040_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_375_cast_fp16)[name = tensor<string, []>("op_4040_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4041_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_377_cast_fp16)[name = tensor<string, []>("op_4041_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4042_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_379_cast_fp16)[name = tensor<string, []>("op_4042_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4043_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_381_cast_fp16)[name = tensor<string, []>("op_4043_cast_fp16")];
            tensor<fp16, [1, 1500, 1, 375]> var_4044_cast_fp16 = softmax(axis = var_3510, x = aw_chunk_cast_fp16)[name = tensor<string, []>("op_4044_cast_fp16")];
            tensor<string, []> var_4046_equation_0 = const()[name = tensor<string, []>("op_4046_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4046_cast_fp16 = einsum(equation = var_4046_equation_0, values = (var_3854_cast_fp16, var_4013_cast_fp16))[name = tensor<string, []>("op_4046_cast_fp16")];
            tensor<string, []> var_4048_equation_0 = const()[name = tensor<string, []>("op_4048_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4048_cast_fp16 = einsum(equation = var_4048_equation_0, values = (var_3854_cast_fp16, var_4014_cast_fp16))[name = tensor<string, []>("op_4048_cast_fp16")];
            tensor<string, []> var_4050_equation_0 = const()[name = tensor<string, []>("op_4050_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4050_cast_fp16 = einsum(equation = var_4050_equation_0, values = (var_3854_cast_fp16, var_4015_cast_fp16))[name = tensor<string, []>("op_4050_cast_fp16")];
            tensor<string, []> var_4052_equation_0 = const()[name = tensor<string, []>("op_4052_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4052_cast_fp16 = einsum(equation = var_4052_equation_0, values = (var_3854_cast_fp16, var_4016_cast_fp16))[name = tensor<string, []>("op_4052_cast_fp16")];
            tensor<string, []> var_4054_equation_0 = const()[name = tensor<string, []>("op_4054_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4054_cast_fp16 = einsum(equation = var_4054_equation_0, values = (var_3858_cast_fp16, var_4017_cast_fp16))[name = tensor<string, []>("op_4054_cast_fp16")];
            tensor<string, []> var_4056_equation_0 = const()[name = tensor<string, []>("op_4056_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4056_cast_fp16 = einsum(equation = var_4056_equation_0, values = (var_3858_cast_fp16, var_4018_cast_fp16))[name = tensor<string, []>("op_4056_cast_fp16")];
            tensor<string, []> var_4058_equation_0 = const()[name = tensor<string, []>("op_4058_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4058_cast_fp16 = einsum(equation = var_4058_equation_0, values = (var_3858_cast_fp16, var_4019_cast_fp16))[name = tensor<string, []>("op_4058_cast_fp16")];
            tensor<string, []> var_4060_equation_0 = const()[name = tensor<string, []>("op_4060_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4060_cast_fp16 = einsum(equation = var_4060_equation_0, values = (var_3858_cast_fp16, var_4020_cast_fp16))[name = tensor<string, []>("op_4060_cast_fp16")];
            tensor<string, []> var_4062_equation_0 = const()[name = tensor<string, []>("op_4062_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4062_cast_fp16 = einsum(equation = var_4062_equation_0, values = (var_3862_cast_fp16, var_4021_cast_fp16))[name = tensor<string, []>("op_4062_cast_fp16")];
            tensor<string, []> var_4064_equation_0 = const()[name = tensor<string, []>("op_4064_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4064_cast_fp16 = einsum(equation = var_4064_equation_0, values = (var_3862_cast_fp16, var_4022_cast_fp16))[name = tensor<string, []>("op_4064_cast_fp16")];
            tensor<string, []> var_4066_equation_0 = const()[name = tensor<string, []>("op_4066_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4066_cast_fp16 = einsum(equation = var_4066_equation_0, values = (var_3862_cast_fp16, var_4023_cast_fp16))[name = tensor<string, []>("op_4066_cast_fp16")];
            tensor<string, []> var_4068_equation_0 = const()[name = tensor<string, []>("op_4068_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4068_cast_fp16 = einsum(equation = var_4068_equation_0, values = (var_3862_cast_fp16, var_4024_cast_fp16))[name = tensor<string, []>("op_4068_cast_fp16")];
            tensor<string, []> var_4070_equation_0 = const()[name = tensor<string, []>("op_4070_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4070_cast_fp16 = einsum(equation = var_4070_equation_0, values = (var_3866_cast_fp16, var_4025_cast_fp16))[name = tensor<string, []>("op_4070_cast_fp16")];
            tensor<string, []> var_4072_equation_0 = const()[name = tensor<string, []>("op_4072_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4072_cast_fp16 = einsum(equation = var_4072_equation_0, values = (var_3866_cast_fp16, var_4026_cast_fp16))[name = tensor<string, []>("op_4072_cast_fp16")];
            tensor<string, []> var_4074_equation_0 = const()[name = tensor<string, []>("op_4074_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4074_cast_fp16 = einsum(equation = var_4074_equation_0, values = (var_3866_cast_fp16, var_4027_cast_fp16))[name = tensor<string, []>("op_4074_cast_fp16")];
            tensor<string, []> var_4076_equation_0 = const()[name = tensor<string, []>("op_4076_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4076_cast_fp16 = einsum(equation = var_4076_equation_0, values = (var_3866_cast_fp16, var_4028_cast_fp16))[name = tensor<string, []>("op_4076_cast_fp16")];
            tensor<string, []> var_4078_equation_0 = const()[name = tensor<string, []>("op_4078_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4078_cast_fp16 = einsum(equation = var_4078_equation_0, values = (var_3870_cast_fp16, var_4029_cast_fp16))[name = tensor<string, []>("op_4078_cast_fp16")];
            tensor<string, []> var_4080_equation_0 = const()[name = tensor<string, []>("op_4080_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4080_cast_fp16 = einsum(equation = var_4080_equation_0, values = (var_3870_cast_fp16, var_4030_cast_fp16))[name = tensor<string, []>("op_4080_cast_fp16")];
            tensor<string, []> var_4082_equation_0 = const()[name = tensor<string, []>("op_4082_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4082_cast_fp16 = einsum(equation = var_4082_equation_0, values = (var_3870_cast_fp16, var_4031_cast_fp16))[name = tensor<string, []>("op_4082_cast_fp16")];
            tensor<string, []> var_4084_equation_0 = const()[name = tensor<string, []>("op_4084_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4084_cast_fp16 = einsum(equation = var_4084_equation_0, values = (var_3870_cast_fp16, var_4032_cast_fp16))[name = tensor<string, []>("op_4084_cast_fp16")];
            tensor<string, []> var_4086_equation_0 = const()[name = tensor<string, []>("op_4086_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4086_cast_fp16 = einsum(equation = var_4086_equation_0, values = (var_3874_cast_fp16, var_4033_cast_fp16))[name = tensor<string, []>("op_4086_cast_fp16")];
            tensor<string, []> var_4088_equation_0 = const()[name = tensor<string, []>("op_4088_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4088_cast_fp16 = einsum(equation = var_4088_equation_0, values = (var_3874_cast_fp16, var_4034_cast_fp16))[name = tensor<string, []>("op_4088_cast_fp16")];
            tensor<string, []> var_4090_equation_0 = const()[name = tensor<string, []>("op_4090_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4090_cast_fp16 = einsum(equation = var_4090_equation_0, values = (var_3874_cast_fp16, var_4035_cast_fp16))[name = tensor<string, []>("op_4090_cast_fp16")];
            tensor<string, []> var_4092_equation_0 = const()[name = tensor<string, []>("op_4092_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4092_cast_fp16 = einsum(equation = var_4092_equation_0, values = (var_3874_cast_fp16, var_4036_cast_fp16))[name = tensor<string, []>("op_4092_cast_fp16")];
            tensor<string, []> var_4094_equation_0 = const()[name = tensor<string, []>("op_4094_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4094_cast_fp16 = einsum(equation = var_4094_equation_0, values = (var_3878_cast_fp16, var_4037_cast_fp16))[name = tensor<string, []>("op_4094_cast_fp16")];
            tensor<string, []> var_4096_equation_0 = const()[name = tensor<string, []>("op_4096_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4096_cast_fp16 = einsum(equation = var_4096_equation_0, values = (var_3878_cast_fp16, var_4038_cast_fp16))[name = tensor<string, []>("op_4096_cast_fp16")];
            tensor<string, []> var_4098_equation_0 = const()[name = tensor<string, []>("op_4098_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4098_cast_fp16 = einsum(equation = var_4098_equation_0, values = (var_3878_cast_fp16, var_4039_cast_fp16))[name = tensor<string, []>("op_4098_cast_fp16")];
            tensor<string, []> var_4100_equation_0 = const()[name = tensor<string, []>("op_4100_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4100_cast_fp16 = einsum(equation = var_4100_equation_0, values = (var_3878_cast_fp16, var_4040_cast_fp16))[name = tensor<string, []>("op_4100_cast_fp16")];
            tensor<string, []> var_4102_equation_0 = const()[name = tensor<string, []>("op_4102_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4102_cast_fp16 = einsum(equation = var_4102_equation_0, values = (var_3882_cast_fp16, var_4041_cast_fp16))[name = tensor<string, []>("op_4102_cast_fp16")];
            tensor<string, []> var_4104_equation_0 = const()[name = tensor<string, []>("op_4104_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4104_cast_fp16 = einsum(equation = var_4104_equation_0, values = (var_3882_cast_fp16, var_4042_cast_fp16))[name = tensor<string, []>("op_4104_cast_fp16")];
            tensor<string, []> var_4106_equation_0 = const()[name = tensor<string, []>("op_4106_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4106_cast_fp16 = einsum(equation = var_4106_equation_0, values = (var_3882_cast_fp16, var_4043_cast_fp16))[name = tensor<string, []>("op_4106_cast_fp16")];
            tensor<string, []> var_4108_equation_0 = const()[name = tensor<string, []>("op_4108_equation_0"), val = tensor<string, []>("bchk,bkhq->bchq")];
            tensor<fp16, [1, 64, 1, 375]> var_4108_cast_fp16 = einsum(equation = var_4108_equation_0, values = (var_3882_cast_fp16, var_4044_cast_fp16))[name = tensor<string, []>("op_4108_cast_fp16")];
            tensor<bool, []> var_4110_interleave_0 = const()[name = tensor<string, []>("op_4110_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_4110_cast_fp16 = concat(axis = var_3497, interleave = var_4110_interleave_0, values = (var_4046_cast_fp16, var_4048_cast_fp16, var_4050_cast_fp16, var_4052_cast_fp16))[name = tensor<string, []>("op_4110_cast_fp16")];
            tensor<bool, []> var_4112_interleave_0 = const()[name = tensor<string, []>("op_4112_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_4112_cast_fp16 = concat(axis = var_3497, interleave = var_4112_interleave_0, values = (var_4054_cast_fp16, var_4056_cast_fp16, var_4058_cast_fp16, var_4060_cast_fp16))[name = tensor<string, []>("op_4112_cast_fp16")];
            tensor<bool, []> var_4114_interleave_0 = const()[name = tensor<string, []>("op_4114_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_4114_cast_fp16 = concat(axis = var_3497, interleave = var_4114_interleave_0, values = (var_4062_cast_fp16, var_4064_cast_fp16, var_4066_cast_fp16, var_4068_cast_fp16))[name = tensor<string, []>("op_4114_cast_fp16")];
            tensor<bool, []> var_4116_interleave_0 = const()[name = tensor<string, []>("op_4116_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_4116_cast_fp16 = concat(axis = var_3497, interleave = var_4116_interleave_0, values = (var_4070_cast_fp16, var_4072_cast_fp16, var_4074_cast_fp16, var_4076_cast_fp16))[name = tensor<string, []>("op_4116_cast_fp16")];
            tensor<bool, []> var_4118_interleave_0 = const()[name = tensor<string, []>("op_4118_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_4118_cast_fp16 = concat(axis = var_3497, interleave = var_4118_interleave_0, values = (var_4078_cast_fp16, var_4080_cast_fp16, var_4082_cast_fp16, var_4084_cast_fp16))[name = tensor<string, []>("op_4118_cast_fp16")];
            tensor<bool, []> var_4120_interleave_0 = const()[name = tensor<string, []>("op_4120_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_4120_cast_fp16 = concat(axis = var_3497, interleave = var_4120_interleave_0, values = (var_4086_cast_fp16, var_4088_cast_fp16, var_4090_cast_fp16, var_4092_cast_fp16))[name = tensor<string, []>("op_4120_cast_fp16")];
            tensor<bool, []> var_4122_interleave_0 = const()[name = tensor<string, []>("op_4122_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_4122_cast_fp16 = concat(axis = var_3497, interleave = var_4122_interleave_0, values = (var_4094_cast_fp16, var_4096_cast_fp16, var_4098_cast_fp16, var_4100_cast_fp16))[name = tensor<string, []>("op_4122_cast_fp16")];
            tensor<bool, []> var_4124_interleave_0 = const()[name = tensor<string, []>("op_4124_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 64, 1, 1500]> var_4124_cast_fp16 = concat(axis = var_3497, interleave = var_4124_interleave_0, values = (var_4102_cast_fp16, var_4104_cast_fp16, var_4106_cast_fp16, var_4108_cast_fp16))[name = tensor<string, []>("op_4124_cast_fp16")];
            tensor<bool, []> input_41_interleave_0 = const()[name = tensor<string, []>("input_41_interleave_0"), val = tensor<bool, []>(false)];
            tensor<fp16, [1, 512, 1, 1500]> input_41_cast_fp16 = concat(axis = var_3510, interleave = input_41_interleave_0, values = (var_4110_cast_fp16, var_4112_cast_fp16, var_4114_cast_fp16, var_4116_cast_fp16, var_4118_cast_fp16, var_4120_cast_fp16, var_4122_cast_fp16, var_4124_cast_fp16))[name = tensor<string, []>("input_41_cast_fp16")];
            tensor<int32, [2]> var_4129 = const()[name = tensor<string, []>("op_4129"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_4131 = const()[name = tensor<string, []>("op_4131"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> obj_pad_type_0 = const()[name = tensor<string, []>("obj_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> obj_pad_0 = const()[name = tensor<string, []>("obj_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 512, 1, 1]> layers_5_self_attn_o_proj_weight_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_o_proj_weight_to_fp16"), val = tensor<fp16, [512, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36460160)))];
            tensor<fp16, [512]> layers_5_self_attn_o_proj_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_self_attn_o_proj_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36984512)))];
            tensor<fp16, [1, 512, 1, 1500]> obj_cast_fp16 = conv(bias = layers_5_self_attn_o_proj_bias_to_fp16, dilations = var_4131, groups = var_3510, pad = obj_pad_0, pad_type = obj_pad_type_0, strides = var_4129, weight = layers_5_self_attn_o_proj_weight_to_fp16, x = input_41_cast_fp16)[name = tensor<string, []>("obj_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_23_cast_fp16 = add(x = inputs_21_cast_fp16, y = obj_cast_fp16)[name = tensor<string, []>("inputs_23_cast_fp16")];
            tensor<int32, [1]> var_4137 = const()[name = tensor<string, []>("op_4137"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_23_cast_fp16 = reduce_mean(axes = var_4137, keep_dims = var_3511, x = inputs_23_cast_fp16)[name = tensor<string, []>("channels_mean_23_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_23_cast_fp16 = sub(x = inputs_23_cast_fp16, y = channels_mean_23_cast_fp16)[name = tensor<string, []>("zero_mean_23_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_23_cast_fp16 = mul(x = zero_mean_23_cast_fp16, y = zero_mean_23_cast_fp16)[name = tensor<string, []>("zero_mean_sq_23_cast_fp16")];
            tensor<int32, [1]> var_4141 = const()[name = tensor<string, []>("op_4141"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_4142_cast_fp16 = reduce_mean(axes = var_4141, keep_dims = var_3511, x = zero_mean_sq_23_cast_fp16)[name = tensor<string, []>("op_4142_cast_fp16")];
            tensor<fp16, []> var_4143_to_fp16 = const()[name = tensor<string, []>("op_4143_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_4144_cast_fp16 = add(x = var_4142_cast_fp16, y = var_4143_to_fp16)[name = tensor<string, []>("op_4144_cast_fp16")];
            tensor<fp16, []> denom_23_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_23_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_23_cast_fp16 = rsqrt(epsilon = denom_23_epsilon_0_to_fp16, x = var_4144_cast_fp16)[name = tensor<string, []>("denom_23_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_23_cast_fp16 = mul(x = zero_mean_23_cast_fp16, y = denom_23_cast_fp16)[name = tensor<string, []>("out_23_cast_fp16")];
            tensor<fp16, [512]> input_43_gamma_0_to_fp16 = const()[name = tensor<string, []>("input_43_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36985600)))];
            tensor<fp16, [512]> input_43_beta_0_to_fp16 = const()[name = tensor<string, []>("input_43_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36986688)))];
            tensor<fp16, []> input_43_epsilon_0_to_fp16 = const()[name = tensor<string, []>("input_43_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> input_43_cast_fp16 = batch_norm(beta = input_43_beta_0_to_fp16, epsilon = input_43_epsilon_0_to_fp16, gamma = input_43_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_23_cast_fp16)[name = tensor<string, []>("input_43_cast_fp16")];
            tensor<int32, [2]> var_4155 = const()[name = tensor<string, []>("op_4155"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_4157 = const()[name = tensor<string, []>("op_4157"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> input_45_pad_type_0 = const()[name = tensor<string, []>("input_45_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> input_45_pad_0 = const()[name = tensor<string, []>("input_45_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [2048, 512, 1, 1]> layers_5_fc1_weight_to_fp16 = const()[name = tensor<string, []>("layers_5_fc1_weight_to_fp16"), val = tensor<fp16, [2048, 512, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(36987776)))];
            tensor<fp16, [2048]> layers_5_fc1_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_fc1_bias_to_fp16"), val = tensor<fp16, [2048]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39084992)))];
            tensor<fp16, [1, 2048, 1, 1500]> input_45_cast_fp16 = conv(bias = layers_5_fc1_bias_to_fp16, dilations = var_4157, groups = var_3510, pad = input_45_pad_0, pad_type = input_45_pad_type_0, strides = var_4155, weight = layers_5_fc1_weight_to_fp16, x = input_43_cast_fp16)[name = tensor<string, []>("input_45_cast_fp16")];
            tensor<string, []> input_mode_0 = const()[name = tensor<string, []>("input_mode_0"), val = tensor<string, []>("EXACT")];
            tensor<fp16, [1, 2048, 1, 1500]> input_cast_fp16 = gelu(mode = input_mode_0, x = input_45_cast_fp16)[name = tensor<string, []>("input_cast_fp16")];
            tensor<int32, [2]> var_4163 = const()[name = tensor<string, []>("op_4163"), val = tensor<int32, [2]>([1, 1])];
            tensor<int32, [2]> var_4165 = const()[name = tensor<string, []>("op_4165"), val = tensor<int32, [2]>([1, 1])];
            tensor<string, []> hidden_states_pad_type_0 = const()[name = tensor<string, []>("hidden_states_pad_type_0"), val = tensor<string, []>("custom")];
            tensor<int32, [4]> hidden_states_pad_0 = const()[name = tensor<string, []>("hidden_states_pad_0"), val = tensor<int32, [4]>([0, 0, 0, 0])];
            tensor<fp16, [512, 2048, 1, 1]> layers_5_fc2_weight_to_fp16 = const()[name = tensor<string, []>("layers_5_fc2_weight_to_fp16"), val = tensor<fp16, [512, 2048, 1, 1]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(39089152)))];
            tensor<fp16, [512]> layers_5_fc2_bias_to_fp16 = const()[name = tensor<string, []>("layers_5_fc2_bias_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(41186368)))];
            tensor<fp16, [1, 512, 1, 1500]> hidden_states_cast_fp16 = conv(bias = layers_5_fc2_bias_to_fp16, dilations = var_4165, groups = var_3510, pad = hidden_states_pad_0, pad_type = hidden_states_pad_type_0, strides = var_4163, weight = layers_5_fc2_weight_to_fp16, x = input_cast_fp16)[name = tensor<string, []>("hidden_states_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> inputs_cast_fp16 = add(x = inputs_23_cast_fp16, y = hidden_states_cast_fp16)[name = tensor<string, []>("inputs_cast_fp16")];
            tensor<bool, []> var_4171 = const()[name = tensor<string, []>("op_4171"), val = tensor<bool, []>(true)];
            tensor<int32, [1]> var_4175 = const()[name = tensor<string, []>("op_4175"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> channels_mean_cast_fp16 = reduce_mean(axes = var_4175, keep_dims = var_4171, x = inputs_cast_fp16)[name = tensor<string, []>("channels_mean_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_cast_fp16 = sub(x = inputs_cast_fp16, y = channels_mean_cast_fp16)[name = tensor<string, []>("zero_mean_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> zero_mean_sq_cast_fp16 = mul(x = zero_mean_cast_fp16, y = zero_mean_cast_fp16)[name = tensor<string, []>("zero_mean_sq_cast_fp16")];
            tensor<int32, [1]> var_4179 = const()[name = tensor<string, []>("op_4179"), val = tensor<int32, [1]>([1])];
            tensor<fp16, [1, 1, 1, 1500]> var_4180_cast_fp16 = reduce_mean(axes = var_4179, keep_dims = var_4171, x = zero_mean_sq_cast_fp16)[name = tensor<string, []>("op_4180_cast_fp16")];
            tensor<fp16, []> var_4181_to_fp16 = const()[name = tensor<string, []>("op_4181_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 1, 1, 1500]> var_4182_cast_fp16 = add(x = var_4180_cast_fp16, y = var_4181_to_fp16)[name = tensor<string, []>("op_4182_cast_fp16")];
            tensor<fp16, []> denom_epsilon_0_to_fp16 = const()[name = tensor<string, []>("denom_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1p-24)];
            tensor<fp16, [1, 1, 1, 1500]> denom_cast_fp16 = rsqrt(epsilon = denom_epsilon_0_to_fp16, x = var_4182_cast_fp16)[name = tensor<string, []>("denom_cast_fp16")];
            tensor<fp16, [1, 512, 1, 1500]> out_cast_fp16 = mul(x = zero_mean_cast_fp16, y = denom_cast_fp16)[name = tensor<string, []>("out_cast_fp16")];
            tensor<fp16, [512]> encoder_output_embeds_type_fp32_gamma_0_to_fp16 = const()[name = tensor<string, []>("encoder_output_embeds_type_fp32_gamma_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(41187456)))];
            tensor<fp16, [512]> encoder_output_embeds_type_fp32_beta_0_to_fp16 = const()[name = tensor<string, []>("encoder_output_embeds_type_fp32_beta_0_to_fp16"), val = tensor<fp16, [512]>(BLOBFILE(path = tensor<string, []>("@model_path/weights/weight.bin"), offset = tensor<uint64, []>(41188544)))];
            tensor<fp16, []> encoder_output_embeds_type_fp32_epsilon_0_to_fp16 = const()[name = tensor<string, []>("encoder_output_embeds_type_fp32_epsilon_0_to_fp16"), val = tensor<fp16, []>(0x1.5p-17)];
            tensor<fp16, [1, 512, 1, 1500]> encoder_output_embeds = batch_norm(beta = encoder_output_embeds_type_fp32_beta_0_to_fp16, epsilon = encoder_output_embeds_type_fp32_epsilon_0_to_fp16, gamma = encoder_output_embeds_type_fp32_gamma_0_to_fp16, mean = obj_1_mean_0_to_fp16, variance = obj_1_variance_0_to_fp16, x = out_cast_fp16)[name = tensor<string, []>("encoder_output_embeds_type_fp32_cast_fp16")];
        } -> (encoder_output_embeds);
}