program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "3505.3.2"}, {"coremlc-version", "3505.4.1"}, {"coremltools-component-torch", "2.9.1"}, {"coremltools-source-dialect", "TorchScript"}, {"coremltools-version", "9.0"}})] { func main(tensor bos_emb, tensor cache0, tensor cache1, tensor cache2, tensor cache3, tensor cache4, tensor cache5, tensor position0, tensor position1, tensor position2, tensor position3, tensor position4, tensor position5, tensor sequence) { tensor input_linear_weight = const()[name = tensor("input_linear_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor norm0_1_bias = const()[name = tensor("norm0_1_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(131200)))]; tensor norm0_1_weight = const()[name = tensor("norm0_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135360)))]; tensor attn0_in_proj_weight = const()[name = tensor("attn0_in_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(139520)))]; tensor attn0_out_proj_weight = const()[name = tensor("attn0_out_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12722496)))]; tensor norm0_2_bias = const()[name = tensor("norm0_2_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16916864)))]; tensor norm0_2_weight = const()[name = tensor("norm0_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16921024)))]; tensor linear0_1_weight = const()[name = tensor("linear0_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16925184)))]; tensor linear0_2_weight = const()[name = tensor("linear0_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(33702464)))]; tensor norm1_1_bias = const()[name = tensor("norm1_1_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50479744)))]; tensor norm1_1_weight = const()[name = tensor("norm1_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50483904)))]; tensor attn1_in_proj_weight = const()[name = tensor("attn1_in_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(50488064)))]; tensor attn1_out_proj_weight = const()[name = tensor("attn1_out_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(63071040)))]; tensor norm1_2_bias = const()[name = tensor("norm1_2_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67265408)))]; tensor norm1_2_weight = const()[name = tensor("norm1_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67269568)))]; tensor linear1_1_weight = const()[name = tensor("linear1_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(67273728)))]; tensor linear1_2_weight = const()[name = tensor("linear1_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(84051008)))]; tensor norm2_1_bias = const()[name = tensor("norm2_1_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100828288)))]; tensor norm2_1_weight = const()[name = tensor("norm2_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100832448)))]; tensor attn2_in_proj_weight = const()[name = tensor("attn2_in_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(100836608)))]; tensor attn2_out_proj_weight = const()[name = tensor("attn2_out_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(113419584)))]; tensor norm2_2_bias = const()[name = tensor("norm2_2_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(117613952)))]; tensor norm2_2_weight = const()[name = tensor("norm2_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(117618112)))]; tensor linear2_1_weight = const()[name = tensor("linear2_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(117622272)))]; tensor linear2_2_weight = const()[name = tensor("linear2_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(134399552)))]; tensor norm3_1_bias = const()[name = tensor("norm3_1_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151176832)))]; tensor norm3_1_weight = const()[name = tensor("norm3_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151180992)))]; tensor attn3_in_proj_weight = const()[name = tensor("attn3_in_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(151185152)))]; tensor attn3_out_proj_weight = const()[name = tensor("attn3_out_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163768128)))]; tensor norm3_2_bias = const()[name = tensor("norm3_2_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167962496)))]; tensor norm3_2_weight = const()[name = tensor("norm3_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167966656)))]; tensor linear3_1_weight = const()[name = tensor("linear3_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167970816)))]; tensor linear3_2_weight = const()[name = tensor("linear3_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184748096)))]; tensor norm4_1_bias = const()[name = tensor("norm4_1_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201525376)))]; tensor norm4_1_weight = const()[name = tensor("norm4_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201529536)))]; tensor attn4_in_proj_weight = const()[name = tensor("attn4_in_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(201533696)))]; tensor attn4_out_proj_weight = const()[name = tensor("attn4_out_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(214116672)))]; tensor norm4_2_bias = const()[name = tensor("norm4_2_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218311040)))]; tensor norm4_2_weight = const()[name = tensor("norm4_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218315200)))]; tensor linear4_1_weight = const()[name = tensor("linear4_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(218319360)))]; tensor linear4_2_weight = const()[name = tensor("linear4_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(235096640)))]; tensor norm5_1_bias = const()[name = tensor("norm5_1_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(251873920)))]; tensor norm5_1_weight = const()[name = tensor("norm5_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(251878080)))]; tensor attn5_in_proj_weight = const()[name = tensor("attn5_in_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(251882240)))]; tensor attn5_out_proj_weight = const()[name = tensor("attn5_out_proj_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(264465216)))]; tensor norm5_2_bias = const()[name = tensor("norm5_2_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268659584)))]; tensor norm5_2_weight = const()[name = tensor("norm5_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268663744)))]; tensor linear5_1_weight = const()[name = tensor("linear5_1_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268667904)))]; tensor linear5_2_weight = const()[name = tensor("linear5_2_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(285445184)))]; tensor out_norm_bias = const()[name = tensor("out_norm_bias"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302222464)))]; tensor out_norm_weight = const()[name = tensor("out_norm_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302226624)))]; tensor out_eos_bias = const()[name = tensor("out_eos_bias"), val = tensor([-0x1.42p-2])]; tensor out_eos_weight = const()[name = tensor("out_eos_weight"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302230784)))]; tensor var_54 = not_equal(x = sequence, y = sequence)[name = tensor("op_54")]; tensor expand_dims_0_axes_0 = const()[name = tensor("expand_dims_0_axes_0"), val = tensor([0, 1])]; tensor expand_dims_0 = expand_dims(axes = expand_dims_0_axes_0, x = bos_emb)[name = tensor("expand_dims_0")]; tensor input_1 = select(a = expand_dims_0, b = sequence, cond = var_54)[name = tensor("input_1")]; tensor linear_0_bias_0 = const()[name = tensor("linear_0_bias_0"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302234944)))]; tensor input_3 = linear(bias = linear_0_bias_0, weight = input_linear_weight, x = input_1)[name = tensor("linear_0")]; tensor var_60 = const()[name = tensor("op_60"), val = tensor(0x1.4f8b58p-17)]; tensor x_1_axes_0 = const()[name = tensor("x_1_axes_0"), val = tensor([-1])]; tensor x_1 = layer_norm(axes = x_1_axes_0, beta = norm0_1_bias, epsilon = var_60, gamma = norm0_1_weight, x = input_3)[name = tensor("x_1")]; tensor linear_1_bias_0 = const()[name = tensor("linear_1_bias_0"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302239104)))]; tensor var_92 = linear(bias = linear_1_bias_0, weight = attn0_in_proj_weight, x = x_1)[name = tensor("linear_1")]; tensor var_96 = const()[name = tensor("op_96"), val = tensor([1, 1, 3, 16, 64])]; tensor qkv_1 = reshape(shape = var_96, x = var_92)[name = tensor("qkv_1")]; tensor q_1_begin_0 = const()[name = tensor("q_1_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_1_end_0 = const()[name = tensor("q_1_end_0"), val = tensor([1, 1, 1, 16, 64])]; tensor q_1_end_mask_0 = const()[name = tensor("q_1_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_1_squeeze_mask_0 = const()[name = tensor("q_1_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_1 = slice_by_index(begin = q_1_begin_0, end = q_1_end_0, end_mask = q_1_end_mask_0, squeeze_mask = q_1_squeeze_mask_0, x = qkv_1)[name = tensor("q_1")]; tensor k_1_begin_0 = const()[name = tensor("k_1_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_1_end_0 = const()[name = tensor("k_1_end_0"), val = tensor([1, 1, 2, 16, 64])]; tensor k_1_end_mask_0 = const()[name = tensor("k_1_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_1_squeeze_mask_0 = const()[name = tensor("k_1_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_1 = slice_by_index(begin = k_1_begin_0, end = k_1_end_0, end_mask = k_1_end_mask_0, squeeze_mask = k_1_squeeze_mask_0, x = qkv_1)[name = tensor("k_1")]; tensor v_1_begin_0 = const()[name = tensor("v_1_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_1_end_0 = const()[name = tensor("v_1_end_0"), val = tensor([1, 1, 3, 16, 64])]; tensor v_1_end_mask_0 = const()[name = tensor("v_1_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_1_squeeze_mask_0 = const()[name = tensor("v_1_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_1 = slice_by_index(begin = v_1_begin_0, end = v_1_end_0, end_mask = v_1_end_mask_0, squeeze_mask = v_1_squeeze_mask_0, x = qkv_1)[name = tensor("v_1")]; tensor freqs_1 = const()[name = tensor("freqs_1"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302251456)))]; tensor var_200 = const()[name = tensor("op_200"), val = tensor([1, 1, 1, 1])]; tensor ts_5 = reshape(shape = var_200, x = position0)[name = tensor("ts_5")]; tensor var_204 = const()[name = tensor("op_204"), val = tensor([1, 1, 16, 32, 2])]; tensor q_complex_1 = reshape(shape = var_204, x = q_1)[name = tensor("q_complex_1")]; tensor var_208 = const()[name = tensor("op_208"), val = tensor([1, 1, 16, 32, 2])]; tensor k_complex_1 = reshape(shape = var_208, x = k_1)[name = tensor("k_complex_1")]; tensor var_212_begin_0 = const()[name = tensor("op_212_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_212_end_0 = const()[name = tensor("op_212_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_212_end_mask_0 = const()[name = tensor("op_212_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_212_squeeze_mask_0 = const()[name = tensor("op_212_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_212 = slice_by_index(begin = var_212_begin_0, end = var_212_end_0, end_mask = var_212_end_mask_0, squeeze_mask = var_212_squeeze_mask_0, x = q_complex_1)[name = tensor("op_212")]; tensor var_220_begin_0 = const()[name = tensor("op_220_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_220_end_0 = const()[name = tensor("op_220_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_220_end_mask_0 = const()[name = tensor("op_220_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_220_squeeze_mask_0 = const()[name = tensor("op_220_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_220 = slice_by_index(begin = var_220_begin_0, end = var_220_end_0, end_mask = var_220_end_mask_0, squeeze_mask = var_220_squeeze_mask_0, x = q_complex_1)[name = tensor("op_220")]; tensor var_228_begin_0 = const()[name = tensor("op_228_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_228_end_0 = const()[name = tensor("op_228_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_228_end_mask_0 = const()[name = tensor("op_228_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_228_squeeze_mask_0 = const()[name = tensor("op_228_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_228 = slice_by_index(begin = var_228_begin_0, end = var_228_end_0, end_mask = var_228_end_mask_0, squeeze_mask = var_228_squeeze_mask_0, x = k_complex_1)[name = tensor("op_228")]; tensor var_236_begin_0 = const()[name = tensor("op_236_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_236_end_0 = const()[name = tensor("op_236_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_236_end_mask_0 = const()[name = tensor("op_236_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_236_squeeze_mask_0 = const()[name = tensor("op_236_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_236 = slice_by_index(begin = var_236_begin_0, end = var_236_end_0, end_mask = var_236_end_mask_0, squeeze_mask = var_236_squeeze_mask_0, x = k_complex_1)[name = tensor("op_236")]; tensor var_242 = mul(x = freqs_1, y = ts_5)[name = tensor("op_242")]; tensor rotr_1 = cos(x = var_242)[name = tensor("rotr_1")]; tensor roti_1 = sin(x = var_242)[name = tensor("roti_1")]; tensor var_246 = mul(x = var_212, y = rotr_1)[name = tensor("op_246")]; tensor var_247 = mul(x = var_220, y = roti_1)[name = tensor("op_247")]; tensor qor_1 = sub(x = var_246, y = var_247)[name = tensor("qor_1")]; tensor var_250 = mul(x = var_212, y = roti_1)[name = tensor("op_250")]; tensor var_251 = mul(x = var_220, y = rotr_1)[name = tensor("op_251")]; tensor qoi_1 = add(x = var_250, y = var_251)[name = tensor("qoi_1")]; tensor var_254 = mul(x = var_228, y = rotr_1)[name = tensor("op_254")]; tensor var_255 = mul(x = var_236, y = roti_1)[name = tensor("op_255")]; tensor kor_1 = sub(x = var_254, y = var_255)[name = tensor("kor_1")]; tensor var_258 = mul(x = var_228, y = roti_1)[name = tensor("op_258")]; tensor var_259 = mul(x = var_236, y = rotr_1)[name = tensor("op_259")]; tensor koi_1 = add(x = var_258, y = var_259)[name = tensor("koi_1")]; tensor qo_1_axis_0 = const()[name = tensor("qo_1_axis_0"), val = tensor(-1)]; tensor qo_1 = stack(axis = qo_1_axis_0, values = (qor_1, qoi_1))[name = tensor("qo_1")]; tensor ko_1_axis_0 = const()[name = tensor("ko_1_axis_0"), val = tensor(-1)]; tensor ko_1 = stack(axis = ko_1_axis_0, values = (kor_1, koi_1))[name = tensor("ko_1")]; tensor var_288 = const()[name = tensor("op_288"), val = tensor([1, 1, 16, 64])]; tensor q_3 = reshape(shape = var_288, x = qo_1)[name = tensor("q_3")]; tensor var_290 = const()[name = tensor("op_290"), val = tensor([1, 1, 16, 64])]; tensor k_3 = reshape(shape = var_290, x = ko_1)[name = tensor("k_3")]; tensor _inversed_312_y_0 = const()[name = tensor("_inversed_312_y_0"), val = tensor(0x1p-9)]; tensor _inversed_312 = mul(x = ts_5, y = _inversed_312_y_0)[name = tensor("_inversed_312")]; tensor var_313 = floor(x = _inversed_312)[name = tensor("op_313")]; tensor var_314 = const()[name = tensor("op_314"), val = tensor(0x1p+9)]; tensor var_315 = mul(x = var_313, y = var_314)[name = tensor("op_315")]; tensor write_indices_float_3 = sub(x = ts_5, y = var_315)[name = tensor("write_indices_float_3")]; tensor var_322_dtype_0 = const()[name = tensor("op_322_dtype_0"), val = tensor("int32")]; tensor write_indices_1_reps_0 = const()[name = tensor("write_indices_1_reps_0"), val = tensor([1, 1, 16, 64])]; tensor var_322 = cast(dtype = var_322_dtype_0, x = write_indices_float_3)[name = tensor("cast_113")]; tensor write_indices_1 = tile(reps = write_indices_1_reps_0, x = var_322)[name = tensor("write_indices_1")]; tensor var_330_begin_0 = const()[name = tensor("op_330_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_330_end_0 = const()[name = tensor("op_330_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor var_330_end_mask_0 = const()[name = tensor("op_330_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_330_squeeze_mask_0 = const()[name = tensor("op_330_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_330 = slice_by_index(begin = var_330_begin_0, end = var_330_end_0, end_mask = var_330_end_mask_0, squeeze_mask = var_330_squeeze_mask_0, x = cache0)[name = tensor("op_330")]; tensor var_332_axis_0 = const()[name = tensor("op_332_axis_0"), val = tensor(1)]; tensor var_332_mode_0 = const()[name = tensor("op_332_mode_0"), val = tensor("update")]; tensor var_332_validate_indices_0 = const()[name = tensor("op_332_validate_indices_0"), val = tensor(false)]; tensor var_332 = scatter_along_axis(axis = var_332_axis_0, data = var_330, indices = write_indices_1, mode = var_332_mode_0, updates = k_3, validate_indices = var_332_validate_indices_0)[name = tensor("op_332")]; tensor concat_2 = const()[name = tensor("concat_2"), val = tensor([0, 0, 0, 0, 0])]; tensor concat_3 = const()[name = tensor("concat_3"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_1_internal_tensor_assign_1_stride_0 = const()[name = tensor("new_cache_1_internal_tensor_assign_1_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_1_internal_tensor_assign_1_begin_mask_0 = const()[name = tensor("new_cache_1_internal_tensor_assign_1_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_1_internal_tensor_assign_1_end_mask_0 = const()[name = tensor("new_cache_1_internal_tensor_assign_1_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_1_internal_tensor_assign_1_squeeze_mask_0 = const()[name = tensor("new_cache_1_internal_tensor_assign_1_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_12 = const()[name = tensor("shape_12"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_0 = const()[name = tensor("reduce_prod_0"), val = tensor(1048576)]; tensor range_1d_0_start_0 = const()[name = tensor("range_1d_0_start_0"), val = tensor(0)]; tensor range_1d_0_step_0 = const()[name = tensor("range_1d_0_step_0"), val = tensor(1)]; tensor range_1d_0 = range_1d(end = reduce_prod_0, start = range_1d_0_start_0, step = range_1d_0_step_0)[name = tensor("range_1d_0")]; tensor reshape_0 = reshape(shape = shape_12, x = range_1d_0)[name = tensor("reshape_0")]; tensor slice_by_index_0 = slice_by_index(begin = concat_2, begin_mask = new_cache_1_internal_tensor_assign_1_begin_mask_0, end = concat_3, end_mask = new_cache_1_internal_tensor_assign_1_end_mask_0, squeeze_mask = new_cache_1_internal_tensor_assign_1_squeeze_mask_0, stride = new_cache_1_internal_tensor_assign_1_stride_0, x = reshape_0)[name = tensor("slice_by_index_0")]; tensor reshape_1_shape_0 = const()[name = tensor("reshape_1_shape_0"), val = tensor([-1])]; tensor reshape_1 = reshape(shape = reshape_1_shape_0, x = slice_by_index_0)[name = tensor("reshape_1")]; tensor reshape_2_shape_0 = const()[name = tensor("reshape_2_shape_0"), val = tensor([-1])]; tensor reshape_2 = reshape(shape = reshape_2_shape_0, x = var_332)[name = tensor("reshape_2")]; tensor reshape_3_shape_0 = const()[name = tensor("reshape_3_shape_0"), val = tensor([-1])]; tensor reshape_3 = reshape(shape = reshape_3_shape_0, x = cache0)[name = tensor("reshape_3")]; tensor scatter_0_mode_0 = const()[name = tensor("scatter_0_mode_0"), val = tensor("update")]; tensor scatter_0_axis_0 = const()[name = tensor("scatter_0_axis_0"), val = tensor(0)]; tensor scatter_0_validate_indices_0 = const()[name = tensor("scatter_0_validate_indices_0"), val = tensor(false)]; tensor scatter_0 = scatter(axis = scatter_0_axis_0, data = reshape_3, indices = reshape_1, mode = scatter_0_mode_0, updates = reshape_2, validate_indices = scatter_0_validate_indices_0)[name = tensor("scatter_0")]; tensor reshape_4 = reshape(shape = shape_12, x = scatter_0)[name = tensor("reshape_4")]; tensor var_340_begin_0 = const()[name = tensor("op_340_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor var_340_end_0 = const()[name = tensor("op_340_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor var_340_end_mask_0 = const()[name = tensor("op_340_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_340_squeeze_mask_0 = const()[name = tensor("op_340_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_340 = slice_by_index(begin = var_340_begin_0, end = var_340_end_0, end_mask = var_340_end_mask_0, squeeze_mask = var_340_squeeze_mask_0, x = reshape_4)[name = tensor("op_340")]; tensor var_342_axis_0 = const()[name = tensor("op_342_axis_0"), val = tensor(1)]; tensor var_342_mode_0 = const()[name = tensor("op_342_mode_0"), val = tensor("update")]; tensor var_342_validate_indices_0 = const()[name = tensor("op_342_validate_indices_0"), val = tensor(false)]; tensor var_342 = scatter_along_axis(axis = var_342_axis_0, data = var_340, indices = write_indices_1, mode = var_342_mode_0, updates = v_1, validate_indices = var_342_validate_indices_0)[name = tensor("op_342")]; tensor concat_4 = const()[name = tensor("concat_4"), val = tensor([1, 0, 0, 0, 0])]; tensor concat_5 = const()[name = tensor("concat_5"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_1_internal_tensor_assign_2_stride_0 = const()[name = tensor("new_cache_1_internal_tensor_assign_2_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_1_internal_tensor_assign_2_begin_mask_0 = const()[name = tensor("new_cache_1_internal_tensor_assign_2_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_1_internal_tensor_assign_2_end_mask_0 = const()[name = tensor("new_cache_1_internal_tensor_assign_2_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_1_internal_tensor_assign_2_squeeze_mask_0 = const()[name = tensor("new_cache_1_internal_tensor_assign_2_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_13 = const()[name = tensor("shape_13"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_1 = const()[name = tensor("reduce_prod_1"), val = tensor(1048576)]; tensor range_1d_1_start_0 = const()[name = tensor("range_1d_1_start_0"), val = tensor(0)]; tensor range_1d_1_step_0 = const()[name = tensor("range_1d_1_step_0"), val = tensor(1)]; tensor range_1d_1 = range_1d(end = reduce_prod_1, start = range_1d_1_start_0, step = range_1d_1_step_0)[name = tensor("range_1d_1")]; tensor reshape_5 = reshape(shape = shape_13, x = range_1d_1)[name = tensor("reshape_5")]; tensor slice_by_index_1 = slice_by_index(begin = concat_4, begin_mask = new_cache_1_internal_tensor_assign_2_begin_mask_0, end = concat_5, end_mask = new_cache_1_internal_tensor_assign_2_end_mask_0, squeeze_mask = new_cache_1_internal_tensor_assign_2_squeeze_mask_0, stride = new_cache_1_internal_tensor_assign_2_stride_0, x = reshape_5)[name = tensor("slice_by_index_1")]; tensor reshape_6_shape_0 = const()[name = tensor("reshape_6_shape_0"), val = tensor([-1])]; tensor reshape_6 = reshape(shape = reshape_6_shape_0, x = slice_by_index_1)[name = tensor("reshape_6")]; tensor reshape_7_shape_0 = const()[name = tensor("reshape_7_shape_0"), val = tensor([-1])]; tensor reshape_7 = reshape(shape = reshape_7_shape_0, x = var_342)[name = tensor("reshape_7")]; tensor reshape_8_shape_0 = const()[name = tensor("reshape_8_shape_0"), val = tensor([-1])]; tensor reshape_8 = reshape(shape = reshape_8_shape_0, x = reshape_4)[name = tensor("reshape_8")]; tensor scatter_1_mode_0 = const()[name = tensor("scatter_1_mode_0"), val = tensor("update")]; tensor scatter_1_axis_0 = const()[name = tensor("scatter_1_axis_0"), val = tensor(0)]; tensor scatter_1_validate_indices_0 = const()[name = tensor("scatter_1_validate_indices_0"), val = tensor(false)]; tensor scatter_1 = scatter(axis = scatter_1_axis_0, data = reshape_8, indices = reshape_6, mode = scatter_1_mode_0, updates = reshape_7, validate_indices = scatter_1_validate_indices_0)[name = tensor("scatter_1")]; tensor new_cache_1_internal_tensor_assign_2 = reshape(shape = shape_13, x = scatter_1)[name = tensor("reshape_9")]; tensor keys_1_begin_0 = const()[name = tensor("keys_1_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor keys_1_end_0 = const()[name = tensor("keys_1_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor keys_1_end_mask_0 = const()[name = tensor("keys_1_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor keys_1_squeeze_mask_0 = const()[name = tensor("keys_1_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor keys_1 = slice_by_index(begin = keys_1_begin_0, end = keys_1_end_0, end_mask = keys_1_end_mask_0, squeeze_mask = keys_1_squeeze_mask_0, x = new_cache_1_internal_tensor_assign_2)[name = tensor("keys_1")]; tensor values_1_begin_0 = const()[name = tensor("values_1_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor values_1_end_0 = const()[name = tensor("values_1_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor values_1_end_mask_0 = const()[name = tensor("values_1_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor values_1_squeeze_mask_0 = const()[name = tensor("values_1_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor values_1 = slice_by_index(begin = values_1_begin_0, end = values_1_end_0, end_mask = values_1_end_mask_0, squeeze_mask = values_1_squeeze_mask_0, x = new_cache_1_internal_tensor_assign_2)[name = tensor("values_1")]; tensor var_354 = not_equal(x = keys_1, y = keys_1)[name = tensor("op_354")]; tensor var_360 = const()[name = tensor("op_360"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(302251648)))]; tensor keys_3 = select(a = var_360, b = keys_1, cond = var_354)[name = tensor("keys_3")]; tensor var_362 = not_equal(x = values_1, y = values_1)[name = tensor("op_362")]; tensor values_3 = select(a = var_360, b = values_1, cond = var_362)[name = tensor("values_3")]; tensor var_386 = const()[name = tensor("op_386"), val = tensor([0, 2, 1, 3])]; tensor var_399 = const()[name = tensor("op_399"), val = tensor([1, 1, 1])]; tensor var_400 = reshape(shape = var_399, x = position0)[name = tensor("op_400")]; tensor var_417 = const()[name = tensor("op_417"), val = tensor(0x1p+0)]; tensor valid_len_1 = add(x = var_400, y = var_417)[name = tensor("valid_len_1")]; tensor k_positions_1_promoted = const()[name = tensor("k_positions_1_promoted"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304348864)))]; tensor valid_mask_1 = less(x = k_positions_1_promoted, y = valid_len_1)[name = tensor("valid_mask_1")]; tensor causal_mask_1 = less_equal(x = k_positions_1_promoted, y = var_400)[name = tensor("causal_mask_1")]; tensor attn_mask_1 = logical_and(x = valid_mask_1, y = causal_mask_1)[name = tensor("attn_mask_1")]; tensor attn_mask_3_axes_0 = const()[name = tensor("attn_mask_3_axes_0"), val = tensor([1])]; tensor attn_mask_3 = expand_dims(axes = attn_mask_3_axes_0, x = attn_mask_1)[name = tensor("attn_mask_3")]; tensor var_429 = const()[name = tensor("op_429"), val = tensor([0x1.fffe5cp-4])]; tensor var_435_transpose_x_0 = const()[name = tensor("op_435_transpose_x_0"), val = tensor(false)]; tensor var_435_transpose_y_0 = const()[name = tensor("op_435_transpose_y_0"), val = tensor(false)]; tensor transpose_18_perm_0 = const()[name = tensor("transpose_18_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_19_perm_0 = const()[name = tensor("transpose_19_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_19 = transpose(perm = transpose_19_perm_0, x = keys_3)[name = tensor("transpose_51")]; tensor transpose_18 = transpose(perm = transpose_18_perm_0, x = q_3)[name = tensor("transpose_52")]; tensor var_435 = matmul(transpose_x = var_435_transpose_x_0, transpose_y = var_435_transpose_y_0, x = transpose_18, y = transpose_19)[name = tensor("op_435")]; tensor attn_weights_1 = mul(x = var_435, y = var_429)[name = tensor("attn_weights_1")]; tensor var_437 = logical_not(x = attn_mask_3)[name = tensor("op_437")]; tensor var_438 = const()[name = tensor("op_438"), val = tensor(-0x1.ff933cp+127)]; tensor attn_weights_3 = select(a = var_438, b = attn_weights_1, cond = var_437)[name = tensor("attn_weights_3")]; tensor var_440 = const()[name = tensor("op_440"), val = tensor(-1)]; tensor attn_weights_5 = softmax(axis = var_440, x = attn_weights_3)[name = tensor("attn_weights_5")]; tensor attn_output_1_transpose_x_0 = const()[name = tensor("attn_output_1_transpose_x_0"), val = tensor(false)]; tensor attn_output_1_transpose_y_0 = const()[name = tensor("attn_output_1_transpose_y_0"), val = tensor(false)]; tensor values_5 = transpose(perm = var_386, x = values_3)[name = tensor("transpose_53")]; tensor attn_output_1 = matmul(transpose_x = attn_output_1_transpose_x_0, transpose_y = attn_output_1_transpose_y_0, x = attn_weights_5, y = values_5)[name = tensor("attn_output_1")]; tensor var_448 = const()[name = tensor("op_448"), val = tensor([0, 2, 1, 3])]; tensor var_451 = const()[name = tensor("op_451"), val = tensor([1, 1, 1024])]; tensor var_449 = transpose(perm = var_448, x = attn_output_1)[name = tensor("transpose_50")]; tensor input_5 = reshape(shape = var_451, x = var_449)[name = tensor("input_5")]; tensor attn_out_1 = linear(bias = linear_0_bias_0, weight = attn0_out_proj_weight, x = input_5)[name = tensor("linear_2")]; tensor var_457 = const()[name = tensor("op_457"), val = tensor(0x1p+0)]; tensor var_458 = add(x = position0, y = var_457)[name = tensor("op_458")]; tensor input_7 = add(x = input_3, y = attn_out_1)[name = tensor("input_7")]; tensor var_462 = const()[name = tensor("op_462"), val = tensor(0x1.4f8b58p-17)]; tensor input_9_axes_0 = const()[name = tensor("input_9_axes_0"), val = tensor([-1])]; tensor input_9 = layer_norm(axes = input_9_axes_0, beta = norm0_2_bias, epsilon = var_462, gamma = norm0_2_weight, x = input_7)[name = tensor("input_9")]; tensor linear_3_bias_0 = const()[name = tensor("linear_3_bias_0"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304350976)))]; tensor var_470 = linear(bias = linear_3_bias_0, weight = linear0_1_weight, x = input_9)[name = tensor("linear_3")]; tensor input_11_mode_0 = const()[name = tensor("input_11_mode_0"), val = tensor("EXACT")]; tensor input_11 = gelu(mode = input_11_mode_0, x = var_470)[name = tensor("input_11")]; tensor ffn_out_1 = linear(bias = linear_0_bias_0, weight = linear0_2_weight, x = input_11)[name = tensor("linear_4")]; tensor input_13 = add(x = input_7, y = ffn_out_1)[name = tensor("input_13")]; tensor var_479 = const()[name = tensor("op_479"), val = tensor(0x1.4f8b58p-17)]; tensor x_3_axes_0 = const()[name = tensor("x_3_axes_0"), val = tensor([-1])]; tensor x_3 = layer_norm(axes = x_3_axes_0, beta = norm1_1_bias, epsilon = var_479, gamma = norm1_1_weight, x = input_13)[name = tensor("x_3")]; tensor var_511 = linear(bias = linear_1_bias_0, weight = attn1_in_proj_weight, x = x_3)[name = tensor("linear_5")]; tensor var_515 = const()[name = tensor("op_515"), val = tensor([1, 1, 3, 16, 64])]; tensor qkv_3 = reshape(shape = var_515, x = var_511)[name = tensor("qkv_3")]; tensor q_7_begin_0 = const()[name = tensor("q_7_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_7_end_0 = const()[name = tensor("q_7_end_0"), val = tensor([1, 1, 1, 16, 64])]; tensor q_7_end_mask_0 = const()[name = tensor("q_7_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_7_squeeze_mask_0 = const()[name = tensor("q_7_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_7 = slice_by_index(begin = q_7_begin_0, end = q_7_end_0, end_mask = q_7_end_mask_0, squeeze_mask = q_7_squeeze_mask_0, x = qkv_3)[name = tensor("q_7")]; tensor k_5_begin_0 = const()[name = tensor("k_5_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_5_end_0 = const()[name = tensor("k_5_end_0"), val = tensor([1, 1, 2, 16, 64])]; tensor k_5_end_mask_0 = const()[name = tensor("k_5_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_5_squeeze_mask_0 = const()[name = tensor("k_5_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_5 = slice_by_index(begin = k_5_begin_0, end = k_5_end_0, end_mask = k_5_end_mask_0, squeeze_mask = k_5_squeeze_mask_0, x = qkv_3)[name = tensor("k_5")]; tensor v_3_begin_0 = const()[name = tensor("v_3_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_3_end_0 = const()[name = tensor("v_3_end_0"), val = tensor([1, 1, 3, 16, 64])]; tensor v_3_end_mask_0 = const()[name = tensor("v_3_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_3_squeeze_mask_0 = const()[name = tensor("v_3_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_3 = slice_by_index(begin = v_3_begin_0, end = v_3_end_0, end_mask = v_3_end_mask_0, squeeze_mask = v_3_squeeze_mask_0, x = qkv_3)[name = tensor("v_3")]; tensor freqs_3 = const()[name = tensor("freqs_3"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304367424)))]; tensor var_619 = const()[name = tensor("op_619"), val = tensor([1, 1, 1, 1])]; tensor ts_11 = reshape(shape = var_619, x = position1)[name = tensor("ts_11")]; tensor var_623 = const()[name = tensor("op_623"), val = tensor([1, 1, 16, 32, 2])]; tensor q_complex_3 = reshape(shape = var_623, x = q_7)[name = tensor("q_complex_3")]; tensor var_627 = const()[name = tensor("op_627"), val = tensor([1, 1, 16, 32, 2])]; tensor k_complex_3 = reshape(shape = var_627, x = k_5)[name = tensor("k_complex_3")]; tensor var_631_begin_0 = const()[name = tensor("op_631_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_631_end_0 = const()[name = tensor("op_631_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_631_end_mask_0 = const()[name = tensor("op_631_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_631_squeeze_mask_0 = const()[name = tensor("op_631_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_631 = slice_by_index(begin = var_631_begin_0, end = var_631_end_0, end_mask = var_631_end_mask_0, squeeze_mask = var_631_squeeze_mask_0, x = q_complex_3)[name = tensor("op_631")]; tensor var_639_begin_0 = const()[name = tensor("op_639_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_639_end_0 = const()[name = tensor("op_639_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_639_end_mask_0 = const()[name = tensor("op_639_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_639_squeeze_mask_0 = const()[name = tensor("op_639_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_639 = slice_by_index(begin = var_639_begin_0, end = var_639_end_0, end_mask = var_639_end_mask_0, squeeze_mask = var_639_squeeze_mask_0, x = q_complex_3)[name = tensor("op_639")]; tensor var_647_begin_0 = const()[name = tensor("op_647_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_647_end_0 = const()[name = tensor("op_647_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_647_end_mask_0 = const()[name = tensor("op_647_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_647_squeeze_mask_0 = const()[name = tensor("op_647_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_647 = slice_by_index(begin = var_647_begin_0, end = var_647_end_0, end_mask = var_647_end_mask_0, squeeze_mask = var_647_squeeze_mask_0, x = k_complex_3)[name = tensor("op_647")]; tensor var_655_begin_0 = const()[name = tensor("op_655_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_655_end_0 = const()[name = tensor("op_655_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_655_end_mask_0 = const()[name = tensor("op_655_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_655_squeeze_mask_0 = const()[name = tensor("op_655_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_655 = slice_by_index(begin = var_655_begin_0, end = var_655_end_0, end_mask = var_655_end_mask_0, squeeze_mask = var_655_squeeze_mask_0, x = k_complex_3)[name = tensor("op_655")]; tensor var_661 = mul(x = freqs_3, y = ts_11)[name = tensor("op_661")]; tensor rotr_3 = cos(x = var_661)[name = tensor("rotr_3")]; tensor roti_3 = sin(x = var_661)[name = tensor("roti_3")]; tensor var_665 = mul(x = var_631, y = rotr_3)[name = tensor("op_665")]; tensor var_666 = mul(x = var_639, y = roti_3)[name = tensor("op_666")]; tensor qor_5 = sub(x = var_665, y = var_666)[name = tensor("qor_5")]; tensor var_669 = mul(x = var_631, y = roti_3)[name = tensor("op_669")]; tensor var_670 = mul(x = var_639, y = rotr_3)[name = tensor("op_670")]; tensor qoi_5 = add(x = var_669, y = var_670)[name = tensor("qoi_5")]; tensor var_673 = mul(x = var_647, y = rotr_3)[name = tensor("op_673")]; tensor var_674 = mul(x = var_655, y = roti_3)[name = tensor("op_674")]; tensor kor_5 = sub(x = var_673, y = var_674)[name = tensor("kor_5")]; tensor var_677 = mul(x = var_647, y = roti_3)[name = tensor("op_677")]; tensor var_678 = mul(x = var_655, y = rotr_3)[name = tensor("op_678")]; tensor koi_5 = add(x = var_677, y = var_678)[name = tensor("koi_5")]; tensor qo_3_axis_0 = const()[name = tensor("qo_3_axis_0"), val = tensor(-1)]; tensor qo_3 = stack(axis = qo_3_axis_0, values = (qor_5, qoi_5))[name = tensor("qo_3")]; tensor ko_3_axis_0 = const()[name = tensor("ko_3_axis_0"), val = tensor(-1)]; tensor ko_3 = stack(axis = ko_3_axis_0, values = (kor_5, koi_5))[name = tensor("ko_3")]; tensor var_707 = const()[name = tensor("op_707"), val = tensor([1, 1, 16, 64])]; tensor q_9 = reshape(shape = var_707, x = qo_3)[name = tensor("q_9")]; tensor var_709 = const()[name = tensor("op_709"), val = tensor([1, 1, 16, 64])]; tensor k_7 = reshape(shape = var_709, x = ko_3)[name = tensor("k_7")]; tensor _inversed_731_y_0 = const()[name = tensor("_inversed_731_y_0"), val = tensor(0x1p-9)]; tensor _inversed_731 = mul(x = ts_11, y = _inversed_731_y_0)[name = tensor("_inversed_731")]; tensor var_732 = floor(x = _inversed_731)[name = tensor("op_732")]; tensor var_733 = const()[name = tensor("op_733"), val = tensor(0x1p+9)]; tensor var_734 = mul(x = var_732, y = var_733)[name = tensor("op_734")]; tensor write_indices_float_7 = sub(x = ts_11, y = var_734)[name = tensor("write_indices_float_7")]; tensor var_741_dtype_0 = const()[name = tensor("op_741_dtype_0"), val = tensor("int32")]; tensor write_indices_3_reps_0 = const()[name = tensor("write_indices_3_reps_0"), val = tensor([1, 1, 16, 64])]; tensor var_741 = cast(dtype = var_741_dtype_0, x = write_indices_float_7)[name = tensor("cast_112")]; tensor write_indices_3 = tile(reps = write_indices_3_reps_0, x = var_741)[name = tensor("write_indices_3")]; tensor var_749_begin_0 = const()[name = tensor("op_749_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_749_end_0 = const()[name = tensor("op_749_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor var_749_end_mask_0 = const()[name = tensor("op_749_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_749_squeeze_mask_0 = const()[name = tensor("op_749_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_749 = slice_by_index(begin = var_749_begin_0, end = var_749_end_0, end_mask = var_749_end_mask_0, squeeze_mask = var_749_squeeze_mask_0, x = cache1)[name = tensor("op_749")]; tensor var_751_axis_0 = const()[name = tensor("op_751_axis_0"), val = tensor(1)]; tensor var_751_mode_0 = const()[name = tensor("op_751_mode_0"), val = tensor("update")]; tensor var_751_validate_indices_0 = const()[name = tensor("op_751_validate_indices_0"), val = tensor(false)]; tensor var_751 = scatter_along_axis(axis = var_751_axis_0, data = var_749, indices = write_indices_3, mode = var_751_mode_0, updates = k_7, validate_indices = var_751_validate_indices_0)[name = tensor("op_751")]; tensor concat_9 = const()[name = tensor("concat_9"), val = tensor([0, 0, 0, 0, 0])]; tensor concat_10 = const()[name = tensor("concat_10"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_3_internal_tensor_assign_1_stride_0 = const()[name = tensor("new_cache_3_internal_tensor_assign_1_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_3_internal_tensor_assign_1_begin_mask_0 = const()[name = tensor("new_cache_3_internal_tensor_assign_1_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_3_internal_tensor_assign_1_end_mask_0 = const()[name = tensor("new_cache_3_internal_tensor_assign_1_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_3_internal_tensor_assign_1_squeeze_mask_0 = const()[name = tensor("new_cache_3_internal_tensor_assign_1_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_14 = const()[name = tensor("shape_14"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_2 = const()[name = tensor("reduce_prod_2"), val = tensor(1048576)]; tensor range_1d_2_start_0 = const()[name = tensor("range_1d_2_start_0"), val = tensor(0)]; tensor range_1d_2_step_0 = const()[name = tensor("range_1d_2_step_0"), val = tensor(1)]; tensor range_1d_2 = range_1d(end = reduce_prod_2, start = range_1d_2_start_0, step = range_1d_2_step_0)[name = tensor("range_1d_2")]; tensor reshape_10 = reshape(shape = shape_14, x = range_1d_2)[name = tensor("reshape_10")]; tensor slice_by_index_2 = slice_by_index(begin = concat_9, begin_mask = new_cache_3_internal_tensor_assign_1_begin_mask_0, end = concat_10, end_mask = new_cache_3_internal_tensor_assign_1_end_mask_0, squeeze_mask = new_cache_3_internal_tensor_assign_1_squeeze_mask_0, stride = new_cache_3_internal_tensor_assign_1_stride_0, x = reshape_10)[name = tensor("slice_by_index_2")]; tensor reshape_11_shape_0 = const()[name = tensor("reshape_11_shape_0"), val = tensor([-1])]; tensor reshape_11 = reshape(shape = reshape_11_shape_0, x = slice_by_index_2)[name = tensor("reshape_11")]; tensor reshape_12_shape_0 = const()[name = tensor("reshape_12_shape_0"), val = tensor([-1])]; tensor reshape_12 = reshape(shape = reshape_12_shape_0, x = var_751)[name = tensor("reshape_12")]; tensor reshape_13_shape_0 = const()[name = tensor("reshape_13_shape_0"), val = tensor([-1])]; tensor reshape_13 = reshape(shape = reshape_13_shape_0, x = cache1)[name = tensor("reshape_13")]; tensor scatter_2_mode_0 = const()[name = tensor("scatter_2_mode_0"), val = tensor("update")]; tensor scatter_2_axis_0 = const()[name = tensor("scatter_2_axis_0"), val = tensor(0)]; tensor scatter_2_validate_indices_0 = const()[name = tensor("scatter_2_validate_indices_0"), val = tensor(false)]; tensor scatter_2 = scatter(axis = scatter_2_axis_0, data = reshape_13, indices = reshape_11, mode = scatter_2_mode_0, updates = reshape_12, validate_indices = scatter_2_validate_indices_0)[name = tensor("scatter_2")]; tensor reshape_14 = reshape(shape = shape_14, x = scatter_2)[name = tensor("reshape_14")]; tensor var_759_begin_0 = const()[name = tensor("op_759_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor var_759_end_0 = const()[name = tensor("op_759_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor var_759_end_mask_0 = const()[name = tensor("op_759_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_759_squeeze_mask_0 = const()[name = tensor("op_759_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_759 = slice_by_index(begin = var_759_begin_0, end = var_759_end_0, end_mask = var_759_end_mask_0, squeeze_mask = var_759_squeeze_mask_0, x = reshape_14)[name = tensor("op_759")]; tensor var_761_axis_0 = const()[name = tensor("op_761_axis_0"), val = tensor(1)]; tensor var_761_mode_0 = const()[name = tensor("op_761_mode_0"), val = tensor("update")]; tensor var_761_validate_indices_0 = const()[name = tensor("op_761_validate_indices_0"), val = tensor(false)]; tensor var_761 = scatter_along_axis(axis = var_761_axis_0, data = var_759, indices = write_indices_3, mode = var_761_mode_0, updates = v_3, validate_indices = var_761_validate_indices_0)[name = tensor("op_761")]; tensor concat_11 = const()[name = tensor("concat_11"), val = tensor([1, 0, 0, 0, 0])]; tensor concat_12 = const()[name = tensor("concat_12"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_3_internal_tensor_assign_2_stride_0 = const()[name = tensor("new_cache_3_internal_tensor_assign_2_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_3_internal_tensor_assign_2_begin_mask_0 = const()[name = tensor("new_cache_3_internal_tensor_assign_2_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_3_internal_tensor_assign_2_end_mask_0 = const()[name = tensor("new_cache_3_internal_tensor_assign_2_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_3_internal_tensor_assign_2_squeeze_mask_0 = const()[name = tensor("new_cache_3_internal_tensor_assign_2_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_15 = const()[name = tensor("shape_15"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_3 = const()[name = tensor("reduce_prod_3"), val = tensor(1048576)]; tensor range_1d_3_start_0 = const()[name = tensor("range_1d_3_start_0"), val = tensor(0)]; tensor range_1d_3_step_0 = const()[name = tensor("range_1d_3_step_0"), val = tensor(1)]; tensor range_1d_3 = range_1d(end = reduce_prod_3, start = range_1d_3_start_0, step = range_1d_3_step_0)[name = tensor("range_1d_3")]; tensor reshape_15 = reshape(shape = shape_15, x = range_1d_3)[name = tensor("reshape_15")]; tensor slice_by_index_3 = slice_by_index(begin = concat_11, begin_mask = new_cache_3_internal_tensor_assign_2_begin_mask_0, end = concat_12, end_mask = new_cache_3_internal_tensor_assign_2_end_mask_0, squeeze_mask = new_cache_3_internal_tensor_assign_2_squeeze_mask_0, stride = new_cache_3_internal_tensor_assign_2_stride_0, x = reshape_15)[name = tensor("slice_by_index_3")]; tensor reshape_16_shape_0 = const()[name = tensor("reshape_16_shape_0"), val = tensor([-1])]; tensor reshape_16 = reshape(shape = reshape_16_shape_0, x = slice_by_index_3)[name = tensor("reshape_16")]; tensor reshape_17_shape_0 = const()[name = tensor("reshape_17_shape_0"), val = tensor([-1])]; tensor reshape_17 = reshape(shape = reshape_17_shape_0, x = var_761)[name = tensor("reshape_17")]; tensor reshape_18_shape_0 = const()[name = tensor("reshape_18_shape_0"), val = tensor([-1])]; tensor reshape_18 = reshape(shape = reshape_18_shape_0, x = reshape_14)[name = tensor("reshape_18")]; tensor scatter_3_mode_0 = const()[name = tensor("scatter_3_mode_0"), val = tensor("update")]; tensor scatter_3_axis_0 = const()[name = tensor("scatter_3_axis_0"), val = tensor(0)]; tensor scatter_3_validate_indices_0 = const()[name = tensor("scatter_3_validate_indices_0"), val = tensor(false)]; tensor scatter_3 = scatter(axis = scatter_3_axis_0, data = reshape_18, indices = reshape_16, mode = scatter_3_mode_0, updates = reshape_17, validate_indices = scatter_3_validate_indices_0)[name = tensor("scatter_3")]; tensor new_cache_3_internal_tensor_assign_2 = reshape(shape = shape_15, x = scatter_3)[name = tensor("reshape_19")]; tensor keys_7_begin_0 = const()[name = tensor("keys_7_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor keys_7_end_0 = const()[name = tensor("keys_7_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor keys_7_end_mask_0 = const()[name = tensor("keys_7_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor keys_7_squeeze_mask_0 = const()[name = tensor("keys_7_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor keys_7 = slice_by_index(begin = keys_7_begin_0, end = keys_7_end_0, end_mask = keys_7_end_mask_0, squeeze_mask = keys_7_squeeze_mask_0, x = new_cache_3_internal_tensor_assign_2)[name = tensor("keys_7")]; tensor values_7_begin_0 = const()[name = tensor("values_7_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor values_7_end_0 = const()[name = tensor("values_7_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor values_7_end_mask_0 = const()[name = tensor("values_7_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor values_7_squeeze_mask_0 = const()[name = tensor("values_7_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor values_7 = slice_by_index(begin = values_7_begin_0, end = values_7_end_0, end_mask = values_7_end_mask_0, squeeze_mask = values_7_squeeze_mask_0, x = new_cache_3_internal_tensor_assign_2)[name = tensor("values_7")]; tensor var_773 = not_equal(x = keys_7, y = keys_7)[name = tensor("op_773")]; tensor keys_9 = select(a = var_360, b = keys_7, cond = var_773)[name = tensor("keys_9")]; tensor var_781 = not_equal(x = values_7, y = values_7)[name = tensor("op_781")]; tensor values_9 = select(a = var_360, b = values_7, cond = var_781)[name = tensor("values_9")]; tensor var_805 = const()[name = tensor("op_805"), val = tensor([0, 2, 1, 3])]; tensor var_818 = const()[name = tensor("op_818"), val = tensor([1, 1, 1])]; tensor var_819 = reshape(shape = var_818, x = position1)[name = tensor("op_819")]; tensor var_836 = const()[name = tensor("op_836"), val = tensor(0x1p+0)]; tensor valid_len_3 = add(x = var_819, y = var_836)[name = tensor("valid_len_3")]; tensor valid_mask_3 = less(x = k_positions_1_promoted, y = valid_len_3)[name = tensor("valid_mask_3")]; tensor causal_mask_3 = less_equal(x = k_positions_1_promoted, y = var_819)[name = tensor("causal_mask_3")]; tensor attn_mask_5 = logical_and(x = valid_mask_3, y = causal_mask_3)[name = tensor("attn_mask_5")]; tensor attn_mask_7_axes_0 = const()[name = tensor("attn_mask_7_axes_0"), val = tensor([1])]; tensor attn_mask_7 = expand_dims(axes = attn_mask_7_axes_0, x = attn_mask_5)[name = tensor("attn_mask_7")]; tensor var_848 = const()[name = tensor("op_848"), val = tensor([0x1.fffe5cp-4])]; tensor var_854_transpose_x_0 = const()[name = tensor("op_854_transpose_x_0"), val = tensor(false)]; tensor var_854_transpose_y_0 = const()[name = tensor("op_854_transpose_y_0"), val = tensor(false)]; tensor transpose_20_perm_0 = const()[name = tensor("transpose_20_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_21_perm_0 = const()[name = tensor("transpose_21_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_21 = transpose(perm = transpose_21_perm_0, x = keys_9)[name = tensor("transpose_47")]; tensor transpose_20 = transpose(perm = transpose_20_perm_0, x = q_9)[name = tensor("transpose_48")]; tensor var_854 = matmul(transpose_x = var_854_transpose_x_0, transpose_y = var_854_transpose_y_0, x = transpose_20, y = transpose_21)[name = tensor("op_854")]; tensor attn_weights_7 = mul(x = var_854, y = var_848)[name = tensor("attn_weights_7")]; tensor var_856 = logical_not(x = attn_mask_7)[name = tensor("op_856")]; tensor var_857 = const()[name = tensor("op_857"), val = tensor(-0x1.ff933cp+127)]; tensor attn_weights_9 = select(a = var_857, b = attn_weights_7, cond = var_856)[name = tensor("attn_weights_9")]; tensor var_859 = const()[name = tensor("op_859"), val = tensor(-1)]; tensor attn_weights_11 = softmax(axis = var_859, x = attn_weights_9)[name = tensor("attn_weights_11")]; tensor attn_output_3_transpose_x_0 = const()[name = tensor("attn_output_3_transpose_x_0"), val = tensor(false)]; tensor attn_output_3_transpose_y_0 = const()[name = tensor("attn_output_3_transpose_y_0"), val = tensor(false)]; tensor values_11 = transpose(perm = var_805, x = values_9)[name = tensor("transpose_49")]; tensor attn_output_3 = matmul(transpose_x = attn_output_3_transpose_x_0, transpose_y = attn_output_3_transpose_y_0, x = attn_weights_11, y = values_11)[name = tensor("attn_output_3")]; tensor var_867 = const()[name = tensor("op_867"), val = tensor([0, 2, 1, 3])]; tensor var_870 = const()[name = tensor("op_870"), val = tensor([1, 1, 1024])]; tensor var_868 = transpose(perm = var_867, x = attn_output_3)[name = tensor("transpose_46")]; tensor input_15 = reshape(shape = var_870, x = var_868)[name = tensor("input_15")]; tensor attn_out_3 = linear(bias = linear_0_bias_0, weight = attn1_out_proj_weight, x = input_15)[name = tensor("linear_6")]; tensor var_876 = const()[name = tensor("op_876"), val = tensor(0x1p+0)]; tensor var_877 = add(x = position1, y = var_876)[name = tensor("op_877")]; tensor input_17 = add(x = input_13, y = attn_out_3)[name = tensor("input_17")]; tensor var_881 = const()[name = tensor("op_881"), val = tensor(0x1.4f8b58p-17)]; tensor input_19_axes_0 = const()[name = tensor("input_19_axes_0"), val = tensor([-1])]; tensor input_19 = layer_norm(axes = input_19_axes_0, beta = norm1_2_bias, epsilon = var_881, gamma = norm1_2_weight, x = input_17)[name = tensor("input_19")]; tensor var_889 = linear(bias = linear_3_bias_0, weight = linear1_1_weight, x = input_19)[name = tensor("linear_7")]; tensor input_21_mode_0 = const()[name = tensor("input_21_mode_0"), val = tensor("EXACT")]; tensor input_21 = gelu(mode = input_21_mode_0, x = var_889)[name = tensor("input_21")]; tensor ffn_out_3 = linear(bias = linear_0_bias_0, weight = linear1_2_weight, x = input_21)[name = tensor("linear_8")]; tensor input_23 = add(x = input_17, y = ffn_out_3)[name = tensor("input_23")]; tensor var_898 = const()[name = tensor("op_898"), val = tensor(0x1.4f8b58p-17)]; tensor x_5_axes_0 = const()[name = tensor("x_5_axes_0"), val = tensor([-1])]; tensor x_5 = layer_norm(axes = x_5_axes_0, beta = norm2_1_bias, epsilon = var_898, gamma = norm2_1_weight, x = input_23)[name = tensor("x_5")]; tensor var_930 = linear(bias = linear_1_bias_0, weight = attn2_in_proj_weight, x = x_5)[name = tensor("linear_9")]; tensor var_934 = const()[name = tensor("op_934"), val = tensor([1, 1, 3, 16, 64])]; tensor qkv_5 = reshape(shape = var_934, x = var_930)[name = tensor("qkv_5")]; tensor q_13_begin_0 = const()[name = tensor("q_13_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_13_end_0 = const()[name = tensor("q_13_end_0"), val = tensor([1, 1, 1, 16, 64])]; tensor q_13_end_mask_0 = const()[name = tensor("q_13_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_13_squeeze_mask_0 = const()[name = tensor("q_13_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_13 = slice_by_index(begin = q_13_begin_0, end = q_13_end_0, end_mask = q_13_end_mask_0, squeeze_mask = q_13_squeeze_mask_0, x = qkv_5)[name = tensor("q_13")]; tensor k_9_begin_0 = const()[name = tensor("k_9_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_9_end_0 = const()[name = tensor("k_9_end_0"), val = tensor([1, 1, 2, 16, 64])]; tensor k_9_end_mask_0 = const()[name = tensor("k_9_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_9_squeeze_mask_0 = const()[name = tensor("k_9_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_9 = slice_by_index(begin = k_9_begin_0, end = k_9_end_0, end_mask = k_9_end_mask_0, squeeze_mask = k_9_squeeze_mask_0, x = qkv_5)[name = tensor("k_9")]; tensor v_5_begin_0 = const()[name = tensor("v_5_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_5_end_0 = const()[name = tensor("v_5_end_0"), val = tensor([1, 1, 3, 16, 64])]; tensor v_5_end_mask_0 = const()[name = tensor("v_5_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_5_squeeze_mask_0 = const()[name = tensor("v_5_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_5 = slice_by_index(begin = v_5_begin_0, end = v_5_end_0, end_mask = v_5_end_mask_0, squeeze_mask = v_5_squeeze_mask_0, x = qkv_5)[name = tensor("v_5")]; tensor freqs_5 = const()[name = tensor("freqs_5"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304367616)))]; tensor var_1038 = const()[name = tensor("op_1038"), val = tensor([1, 1, 1, 1])]; tensor ts_17 = reshape(shape = var_1038, x = position2)[name = tensor("ts_17")]; tensor var_1042 = const()[name = tensor("op_1042"), val = tensor([1, 1, 16, 32, 2])]; tensor q_complex_5 = reshape(shape = var_1042, x = q_13)[name = tensor("q_complex_5")]; tensor var_1046 = const()[name = tensor("op_1046"), val = tensor([1, 1, 16, 32, 2])]; tensor k_complex_5 = reshape(shape = var_1046, x = k_9)[name = tensor("k_complex_5")]; tensor var_1050_begin_0 = const()[name = tensor("op_1050_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1050_end_0 = const()[name = tensor("op_1050_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_1050_end_mask_0 = const()[name = tensor("op_1050_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1050_squeeze_mask_0 = const()[name = tensor("op_1050_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1050 = slice_by_index(begin = var_1050_begin_0, end = var_1050_end_0, end_mask = var_1050_end_mask_0, squeeze_mask = var_1050_squeeze_mask_0, x = q_complex_5)[name = tensor("op_1050")]; tensor var_1058_begin_0 = const()[name = tensor("op_1058_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_1058_end_0 = const()[name = tensor("op_1058_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_1058_end_mask_0 = const()[name = tensor("op_1058_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1058_squeeze_mask_0 = const()[name = tensor("op_1058_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1058 = slice_by_index(begin = var_1058_begin_0, end = var_1058_end_0, end_mask = var_1058_end_mask_0, squeeze_mask = var_1058_squeeze_mask_0, x = q_complex_5)[name = tensor("op_1058")]; tensor var_1066_begin_0 = const()[name = tensor("op_1066_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1066_end_0 = const()[name = tensor("op_1066_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_1066_end_mask_0 = const()[name = tensor("op_1066_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1066_squeeze_mask_0 = const()[name = tensor("op_1066_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1066 = slice_by_index(begin = var_1066_begin_0, end = var_1066_end_0, end_mask = var_1066_end_mask_0, squeeze_mask = var_1066_squeeze_mask_0, x = k_complex_5)[name = tensor("op_1066")]; tensor var_1074_begin_0 = const()[name = tensor("op_1074_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_1074_end_0 = const()[name = tensor("op_1074_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_1074_end_mask_0 = const()[name = tensor("op_1074_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1074_squeeze_mask_0 = const()[name = tensor("op_1074_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1074 = slice_by_index(begin = var_1074_begin_0, end = var_1074_end_0, end_mask = var_1074_end_mask_0, squeeze_mask = var_1074_squeeze_mask_0, x = k_complex_5)[name = tensor("op_1074")]; tensor var_1080 = mul(x = freqs_5, y = ts_17)[name = tensor("op_1080")]; tensor rotr_5 = cos(x = var_1080)[name = tensor("rotr_5")]; tensor roti_5 = sin(x = var_1080)[name = tensor("roti_5")]; tensor var_1084 = mul(x = var_1050, y = rotr_5)[name = tensor("op_1084")]; tensor var_1085 = mul(x = var_1058, y = roti_5)[name = tensor("op_1085")]; tensor qor_9 = sub(x = var_1084, y = var_1085)[name = tensor("qor_9")]; tensor var_1088 = mul(x = var_1050, y = roti_5)[name = tensor("op_1088")]; tensor var_1089 = mul(x = var_1058, y = rotr_5)[name = tensor("op_1089")]; tensor qoi_9 = add(x = var_1088, y = var_1089)[name = tensor("qoi_9")]; tensor var_1092 = mul(x = var_1066, y = rotr_5)[name = tensor("op_1092")]; tensor var_1093 = mul(x = var_1074, y = roti_5)[name = tensor("op_1093")]; tensor kor_9 = sub(x = var_1092, y = var_1093)[name = tensor("kor_9")]; tensor var_1096 = mul(x = var_1066, y = roti_5)[name = tensor("op_1096")]; tensor var_1097 = mul(x = var_1074, y = rotr_5)[name = tensor("op_1097")]; tensor koi_9 = add(x = var_1096, y = var_1097)[name = tensor("koi_9")]; tensor qo_5_axis_0 = const()[name = tensor("qo_5_axis_0"), val = tensor(-1)]; tensor qo_5 = stack(axis = qo_5_axis_0, values = (qor_9, qoi_9))[name = tensor("qo_5")]; tensor ko_5_axis_0 = const()[name = tensor("ko_5_axis_0"), val = tensor(-1)]; tensor ko_5 = stack(axis = ko_5_axis_0, values = (kor_9, koi_9))[name = tensor("ko_5")]; tensor var_1126 = const()[name = tensor("op_1126"), val = tensor([1, 1, 16, 64])]; tensor q_15 = reshape(shape = var_1126, x = qo_5)[name = tensor("q_15")]; tensor var_1128 = const()[name = tensor("op_1128"), val = tensor([1, 1, 16, 64])]; tensor k_11 = reshape(shape = var_1128, x = ko_5)[name = tensor("k_11")]; tensor _inversed_1150_y_0 = const()[name = tensor("_inversed_1150_y_0"), val = tensor(0x1p-9)]; tensor _inversed_1150 = mul(x = ts_17, y = _inversed_1150_y_0)[name = tensor("_inversed_1150")]; tensor var_1151 = floor(x = _inversed_1150)[name = tensor("op_1151")]; tensor var_1152 = const()[name = tensor("op_1152"), val = tensor(0x1p+9)]; tensor var_1153 = mul(x = var_1151, y = var_1152)[name = tensor("op_1153")]; tensor write_indices_float_11 = sub(x = ts_17, y = var_1153)[name = tensor("write_indices_float_11")]; tensor var_1160_dtype_0 = const()[name = tensor("op_1160_dtype_0"), val = tensor("int32")]; tensor write_indices_5_reps_0 = const()[name = tensor("write_indices_5_reps_0"), val = tensor([1, 1, 16, 64])]; tensor var_1160 = cast(dtype = var_1160_dtype_0, x = write_indices_float_11)[name = tensor("cast_111")]; tensor write_indices_5 = tile(reps = write_indices_5_reps_0, x = var_1160)[name = tensor("write_indices_5")]; tensor var_1168_begin_0 = const()[name = tensor("op_1168_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1168_end_0 = const()[name = tensor("op_1168_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor var_1168_end_mask_0 = const()[name = tensor("op_1168_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_1168_squeeze_mask_0 = const()[name = tensor("op_1168_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_1168 = slice_by_index(begin = var_1168_begin_0, end = var_1168_end_0, end_mask = var_1168_end_mask_0, squeeze_mask = var_1168_squeeze_mask_0, x = cache2)[name = tensor("op_1168")]; tensor var_1170_axis_0 = const()[name = tensor("op_1170_axis_0"), val = tensor(1)]; tensor var_1170_mode_0 = const()[name = tensor("op_1170_mode_0"), val = tensor("update")]; tensor var_1170_validate_indices_0 = const()[name = tensor("op_1170_validate_indices_0"), val = tensor(false)]; tensor var_1170 = scatter_along_axis(axis = var_1170_axis_0, data = var_1168, indices = write_indices_5, mode = var_1170_mode_0, updates = k_11, validate_indices = var_1170_validate_indices_0)[name = tensor("op_1170")]; tensor concat_16 = const()[name = tensor("concat_16"), val = tensor([0, 0, 0, 0, 0])]; tensor concat_17 = const()[name = tensor("concat_17"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_5_internal_tensor_assign_1_stride_0 = const()[name = tensor("new_cache_5_internal_tensor_assign_1_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_5_internal_tensor_assign_1_begin_mask_0 = const()[name = tensor("new_cache_5_internal_tensor_assign_1_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_5_internal_tensor_assign_1_end_mask_0 = const()[name = tensor("new_cache_5_internal_tensor_assign_1_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_5_internal_tensor_assign_1_squeeze_mask_0 = const()[name = tensor("new_cache_5_internal_tensor_assign_1_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_16 = const()[name = tensor("shape_16"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_4 = const()[name = tensor("reduce_prod_4"), val = tensor(1048576)]; tensor range_1d_4_start_0 = const()[name = tensor("range_1d_4_start_0"), val = tensor(0)]; tensor range_1d_4_step_0 = const()[name = tensor("range_1d_4_step_0"), val = tensor(1)]; tensor range_1d_4 = range_1d(end = reduce_prod_4, start = range_1d_4_start_0, step = range_1d_4_step_0)[name = tensor("range_1d_4")]; tensor reshape_20 = reshape(shape = shape_16, x = range_1d_4)[name = tensor("reshape_20")]; tensor slice_by_index_4 = slice_by_index(begin = concat_16, begin_mask = new_cache_5_internal_tensor_assign_1_begin_mask_0, end = concat_17, end_mask = new_cache_5_internal_tensor_assign_1_end_mask_0, squeeze_mask = new_cache_5_internal_tensor_assign_1_squeeze_mask_0, stride = new_cache_5_internal_tensor_assign_1_stride_0, x = reshape_20)[name = tensor("slice_by_index_4")]; tensor reshape_21_shape_0 = const()[name = tensor("reshape_21_shape_0"), val = tensor([-1])]; tensor reshape_21 = reshape(shape = reshape_21_shape_0, x = slice_by_index_4)[name = tensor("reshape_21")]; tensor reshape_22_shape_0 = const()[name = tensor("reshape_22_shape_0"), val = tensor([-1])]; tensor reshape_22 = reshape(shape = reshape_22_shape_0, x = var_1170)[name = tensor("reshape_22")]; tensor reshape_23_shape_0 = const()[name = tensor("reshape_23_shape_0"), val = tensor([-1])]; tensor reshape_23 = reshape(shape = reshape_23_shape_0, x = cache2)[name = tensor("reshape_23")]; tensor scatter_4_mode_0 = const()[name = tensor("scatter_4_mode_0"), val = tensor("update")]; tensor scatter_4_axis_0 = const()[name = tensor("scatter_4_axis_0"), val = tensor(0)]; tensor scatter_4_validate_indices_0 = const()[name = tensor("scatter_4_validate_indices_0"), val = tensor(false)]; tensor scatter_4 = scatter(axis = scatter_4_axis_0, data = reshape_23, indices = reshape_21, mode = scatter_4_mode_0, updates = reshape_22, validate_indices = scatter_4_validate_indices_0)[name = tensor("scatter_4")]; tensor reshape_24 = reshape(shape = shape_16, x = scatter_4)[name = tensor("reshape_24")]; tensor var_1178_begin_0 = const()[name = tensor("op_1178_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor var_1178_end_0 = const()[name = tensor("op_1178_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor var_1178_end_mask_0 = const()[name = tensor("op_1178_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_1178_squeeze_mask_0 = const()[name = tensor("op_1178_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_1178 = slice_by_index(begin = var_1178_begin_0, end = var_1178_end_0, end_mask = var_1178_end_mask_0, squeeze_mask = var_1178_squeeze_mask_0, x = reshape_24)[name = tensor("op_1178")]; tensor var_1180_axis_0 = const()[name = tensor("op_1180_axis_0"), val = tensor(1)]; tensor var_1180_mode_0 = const()[name = tensor("op_1180_mode_0"), val = tensor("update")]; tensor var_1180_validate_indices_0 = const()[name = tensor("op_1180_validate_indices_0"), val = tensor(false)]; tensor var_1180 = scatter_along_axis(axis = var_1180_axis_0, data = var_1178, indices = write_indices_5, mode = var_1180_mode_0, updates = v_5, validate_indices = var_1180_validate_indices_0)[name = tensor("op_1180")]; tensor concat_18 = const()[name = tensor("concat_18"), val = tensor([1, 0, 0, 0, 0])]; tensor concat_19 = const()[name = tensor("concat_19"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_5_internal_tensor_assign_2_stride_0 = const()[name = tensor("new_cache_5_internal_tensor_assign_2_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_5_internal_tensor_assign_2_begin_mask_0 = const()[name = tensor("new_cache_5_internal_tensor_assign_2_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_5_internal_tensor_assign_2_end_mask_0 = const()[name = tensor("new_cache_5_internal_tensor_assign_2_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_5_internal_tensor_assign_2_squeeze_mask_0 = const()[name = tensor("new_cache_5_internal_tensor_assign_2_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_17 = const()[name = tensor("shape_17"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_5 = const()[name = tensor("reduce_prod_5"), val = tensor(1048576)]; tensor range_1d_5_start_0 = const()[name = tensor("range_1d_5_start_0"), val = tensor(0)]; tensor range_1d_5_step_0 = const()[name = tensor("range_1d_5_step_0"), val = tensor(1)]; tensor range_1d_5 = range_1d(end = reduce_prod_5, start = range_1d_5_start_0, step = range_1d_5_step_0)[name = tensor("range_1d_5")]; tensor reshape_25 = reshape(shape = shape_17, x = range_1d_5)[name = tensor("reshape_25")]; tensor slice_by_index_5 = slice_by_index(begin = concat_18, begin_mask = new_cache_5_internal_tensor_assign_2_begin_mask_0, end = concat_19, end_mask = new_cache_5_internal_tensor_assign_2_end_mask_0, squeeze_mask = new_cache_5_internal_tensor_assign_2_squeeze_mask_0, stride = new_cache_5_internal_tensor_assign_2_stride_0, x = reshape_25)[name = tensor("slice_by_index_5")]; tensor reshape_26_shape_0 = const()[name = tensor("reshape_26_shape_0"), val = tensor([-1])]; tensor reshape_26 = reshape(shape = reshape_26_shape_0, x = slice_by_index_5)[name = tensor("reshape_26")]; tensor reshape_27_shape_0 = const()[name = tensor("reshape_27_shape_0"), val = tensor([-1])]; tensor reshape_27 = reshape(shape = reshape_27_shape_0, x = var_1180)[name = tensor("reshape_27")]; tensor reshape_28_shape_0 = const()[name = tensor("reshape_28_shape_0"), val = tensor([-1])]; tensor reshape_28 = reshape(shape = reshape_28_shape_0, x = reshape_24)[name = tensor("reshape_28")]; tensor scatter_5_mode_0 = const()[name = tensor("scatter_5_mode_0"), val = tensor("update")]; tensor scatter_5_axis_0 = const()[name = tensor("scatter_5_axis_0"), val = tensor(0)]; tensor scatter_5_validate_indices_0 = const()[name = tensor("scatter_5_validate_indices_0"), val = tensor(false)]; tensor scatter_5 = scatter(axis = scatter_5_axis_0, data = reshape_28, indices = reshape_26, mode = scatter_5_mode_0, updates = reshape_27, validate_indices = scatter_5_validate_indices_0)[name = tensor("scatter_5")]; tensor new_cache_5_internal_tensor_assign_2 = reshape(shape = shape_17, x = scatter_5)[name = tensor("reshape_29")]; tensor keys_13_begin_0 = const()[name = tensor("keys_13_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor keys_13_end_0 = const()[name = tensor("keys_13_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor keys_13_end_mask_0 = const()[name = tensor("keys_13_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor keys_13_squeeze_mask_0 = const()[name = tensor("keys_13_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor keys_13 = slice_by_index(begin = keys_13_begin_0, end = keys_13_end_0, end_mask = keys_13_end_mask_0, squeeze_mask = keys_13_squeeze_mask_0, x = new_cache_5_internal_tensor_assign_2)[name = tensor("keys_13")]; tensor values_13_begin_0 = const()[name = tensor("values_13_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor values_13_end_0 = const()[name = tensor("values_13_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor values_13_end_mask_0 = const()[name = tensor("values_13_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor values_13_squeeze_mask_0 = const()[name = tensor("values_13_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor values_13 = slice_by_index(begin = values_13_begin_0, end = values_13_end_0, end_mask = values_13_end_mask_0, squeeze_mask = values_13_squeeze_mask_0, x = new_cache_5_internal_tensor_assign_2)[name = tensor("values_13")]; tensor var_1192 = not_equal(x = keys_13, y = keys_13)[name = tensor("op_1192")]; tensor keys_15 = select(a = var_360, b = keys_13, cond = var_1192)[name = tensor("keys_15")]; tensor var_1200 = not_equal(x = values_13, y = values_13)[name = tensor("op_1200")]; tensor values_15 = select(a = var_360, b = values_13, cond = var_1200)[name = tensor("values_15")]; tensor var_1224 = const()[name = tensor("op_1224"), val = tensor([0, 2, 1, 3])]; tensor var_1237 = const()[name = tensor("op_1237"), val = tensor([1, 1, 1])]; tensor var_1238 = reshape(shape = var_1237, x = position2)[name = tensor("op_1238")]; tensor var_1255 = const()[name = tensor("op_1255"), val = tensor(0x1p+0)]; tensor valid_len_5 = add(x = var_1238, y = var_1255)[name = tensor("valid_len_5")]; tensor valid_mask_5 = less(x = k_positions_1_promoted, y = valid_len_5)[name = tensor("valid_mask_5")]; tensor causal_mask_5 = less_equal(x = k_positions_1_promoted, y = var_1238)[name = tensor("causal_mask_5")]; tensor attn_mask_9 = logical_and(x = valid_mask_5, y = causal_mask_5)[name = tensor("attn_mask_9")]; tensor attn_mask_11_axes_0 = const()[name = tensor("attn_mask_11_axes_0"), val = tensor([1])]; tensor attn_mask_11 = expand_dims(axes = attn_mask_11_axes_0, x = attn_mask_9)[name = tensor("attn_mask_11")]; tensor var_1267 = const()[name = tensor("op_1267"), val = tensor([0x1.fffe5cp-4])]; tensor var_1273_transpose_x_0 = const()[name = tensor("op_1273_transpose_x_0"), val = tensor(false)]; tensor var_1273_transpose_y_0 = const()[name = tensor("op_1273_transpose_y_0"), val = tensor(false)]; tensor transpose_22_perm_0 = const()[name = tensor("transpose_22_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_23_perm_0 = const()[name = tensor("transpose_23_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_23 = transpose(perm = transpose_23_perm_0, x = keys_15)[name = tensor("transpose_43")]; tensor transpose_22 = transpose(perm = transpose_22_perm_0, x = q_15)[name = tensor("transpose_44")]; tensor var_1273 = matmul(transpose_x = var_1273_transpose_x_0, transpose_y = var_1273_transpose_y_0, x = transpose_22, y = transpose_23)[name = tensor("op_1273")]; tensor attn_weights_13 = mul(x = var_1273, y = var_1267)[name = tensor("attn_weights_13")]; tensor var_1275 = logical_not(x = attn_mask_11)[name = tensor("op_1275")]; tensor var_1276 = const()[name = tensor("op_1276"), val = tensor(-0x1.ff933cp+127)]; tensor attn_weights_15 = select(a = var_1276, b = attn_weights_13, cond = var_1275)[name = tensor("attn_weights_15")]; tensor var_1278 = const()[name = tensor("op_1278"), val = tensor(-1)]; tensor attn_weights_17 = softmax(axis = var_1278, x = attn_weights_15)[name = tensor("attn_weights_17")]; tensor attn_output_5_transpose_x_0 = const()[name = tensor("attn_output_5_transpose_x_0"), val = tensor(false)]; tensor attn_output_5_transpose_y_0 = const()[name = tensor("attn_output_5_transpose_y_0"), val = tensor(false)]; tensor values_17 = transpose(perm = var_1224, x = values_15)[name = tensor("transpose_45")]; tensor attn_output_5 = matmul(transpose_x = attn_output_5_transpose_x_0, transpose_y = attn_output_5_transpose_y_0, x = attn_weights_17, y = values_17)[name = tensor("attn_output_5")]; tensor var_1286 = const()[name = tensor("op_1286"), val = tensor([0, 2, 1, 3])]; tensor var_1289 = const()[name = tensor("op_1289"), val = tensor([1, 1, 1024])]; tensor var_1287 = transpose(perm = var_1286, x = attn_output_5)[name = tensor("transpose_42")]; tensor input_25 = reshape(shape = var_1289, x = var_1287)[name = tensor("input_25")]; tensor attn_out_5 = linear(bias = linear_0_bias_0, weight = attn2_out_proj_weight, x = input_25)[name = tensor("linear_10")]; tensor var_1295 = const()[name = tensor("op_1295"), val = tensor(0x1p+0)]; tensor var_1296 = add(x = position2, y = var_1295)[name = tensor("op_1296")]; tensor input_27 = add(x = input_23, y = attn_out_5)[name = tensor("input_27")]; tensor var_1300 = const()[name = tensor("op_1300"), val = tensor(0x1.4f8b58p-17)]; tensor input_29_axes_0 = const()[name = tensor("input_29_axes_0"), val = tensor([-1])]; tensor input_29 = layer_norm(axes = input_29_axes_0, beta = norm2_2_bias, epsilon = var_1300, gamma = norm2_2_weight, x = input_27)[name = tensor("input_29")]; tensor var_1308 = linear(bias = linear_3_bias_0, weight = linear2_1_weight, x = input_29)[name = tensor("linear_11")]; tensor input_31_mode_0 = const()[name = tensor("input_31_mode_0"), val = tensor("EXACT")]; tensor input_31 = gelu(mode = input_31_mode_0, x = var_1308)[name = tensor("input_31")]; tensor ffn_out_5 = linear(bias = linear_0_bias_0, weight = linear2_2_weight, x = input_31)[name = tensor("linear_12")]; tensor input_33 = add(x = input_27, y = ffn_out_5)[name = tensor("input_33")]; tensor var_1317 = const()[name = tensor("op_1317"), val = tensor(0x1.4f8b58p-17)]; tensor x_7_axes_0 = const()[name = tensor("x_7_axes_0"), val = tensor([-1])]; tensor x_7 = layer_norm(axes = x_7_axes_0, beta = norm3_1_bias, epsilon = var_1317, gamma = norm3_1_weight, x = input_33)[name = tensor("x_7")]; tensor var_1349 = linear(bias = linear_1_bias_0, weight = attn3_in_proj_weight, x = x_7)[name = tensor("linear_13")]; tensor var_1353 = const()[name = tensor("op_1353"), val = tensor([1, 1, 3, 16, 64])]; tensor qkv_7 = reshape(shape = var_1353, x = var_1349)[name = tensor("qkv_7")]; tensor q_19_begin_0 = const()[name = tensor("q_19_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_19_end_0 = const()[name = tensor("q_19_end_0"), val = tensor([1, 1, 1, 16, 64])]; tensor q_19_end_mask_0 = const()[name = tensor("q_19_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_19_squeeze_mask_0 = const()[name = tensor("q_19_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_19 = slice_by_index(begin = q_19_begin_0, end = q_19_end_0, end_mask = q_19_end_mask_0, squeeze_mask = q_19_squeeze_mask_0, x = qkv_7)[name = tensor("q_19")]; tensor k_13_begin_0 = const()[name = tensor("k_13_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_13_end_0 = const()[name = tensor("k_13_end_0"), val = tensor([1, 1, 2, 16, 64])]; tensor k_13_end_mask_0 = const()[name = tensor("k_13_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_13_squeeze_mask_0 = const()[name = tensor("k_13_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_13 = slice_by_index(begin = k_13_begin_0, end = k_13_end_0, end_mask = k_13_end_mask_0, squeeze_mask = k_13_squeeze_mask_0, x = qkv_7)[name = tensor("k_13")]; tensor v_7_begin_0 = const()[name = tensor("v_7_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_7_end_0 = const()[name = tensor("v_7_end_0"), val = tensor([1, 1, 3, 16, 64])]; tensor v_7_end_mask_0 = const()[name = tensor("v_7_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_7_squeeze_mask_0 = const()[name = tensor("v_7_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_7 = slice_by_index(begin = v_7_begin_0, end = v_7_end_0, end_mask = v_7_end_mask_0, squeeze_mask = v_7_squeeze_mask_0, x = qkv_7)[name = tensor("v_7")]; tensor freqs_7 = const()[name = tensor("freqs_7"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304367808)))]; tensor var_1457 = const()[name = tensor("op_1457"), val = tensor([1, 1, 1, 1])]; tensor ts_23 = reshape(shape = var_1457, x = position3)[name = tensor("ts_23")]; tensor var_1461 = const()[name = tensor("op_1461"), val = tensor([1, 1, 16, 32, 2])]; tensor q_complex_7 = reshape(shape = var_1461, x = q_19)[name = tensor("q_complex_7")]; tensor var_1465 = const()[name = tensor("op_1465"), val = tensor([1, 1, 16, 32, 2])]; tensor k_complex_7 = reshape(shape = var_1465, x = k_13)[name = tensor("k_complex_7")]; tensor var_1469_begin_0 = const()[name = tensor("op_1469_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1469_end_0 = const()[name = tensor("op_1469_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_1469_end_mask_0 = const()[name = tensor("op_1469_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1469_squeeze_mask_0 = const()[name = tensor("op_1469_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1469 = slice_by_index(begin = var_1469_begin_0, end = var_1469_end_0, end_mask = var_1469_end_mask_0, squeeze_mask = var_1469_squeeze_mask_0, x = q_complex_7)[name = tensor("op_1469")]; tensor var_1477_begin_0 = const()[name = tensor("op_1477_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_1477_end_0 = const()[name = tensor("op_1477_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_1477_end_mask_0 = const()[name = tensor("op_1477_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1477_squeeze_mask_0 = const()[name = tensor("op_1477_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1477 = slice_by_index(begin = var_1477_begin_0, end = var_1477_end_0, end_mask = var_1477_end_mask_0, squeeze_mask = var_1477_squeeze_mask_0, x = q_complex_7)[name = tensor("op_1477")]; tensor var_1485_begin_0 = const()[name = tensor("op_1485_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1485_end_0 = const()[name = tensor("op_1485_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_1485_end_mask_0 = const()[name = tensor("op_1485_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1485_squeeze_mask_0 = const()[name = tensor("op_1485_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1485 = slice_by_index(begin = var_1485_begin_0, end = var_1485_end_0, end_mask = var_1485_end_mask_0, squeeze_mask = var_1485_squeeze_mask_0, x = k_complex_7)[name = tensor("op_1485")]; tensor var_1493_begin_0 = const()[name = tensor("op_1493_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_1493_end_0 = const()[name = tensor("op_1493_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_1493_end_mask_0 = const()[name = tensor("op_1493_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1493_squeeze_mask_0 = const()[name = tensor("op_1493_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1493 = slice_by_index(begin = var_1493_begin_0, end = var_1493_end_0, end_mask = var_1493_end_mask_0, squeeze_mask = var_1493_squeeze_mask_0, x = k_complex_7)[name = tensor("op_1493")]; tensor var_1499 = mul(x = freqs_7, y = ts_23)[name = tensor("op_1499")]; tensor rotr_7 = cos(x = var_1499)[name = tensor("rotr_7")]; tensor roti_7 = sin(x = var_1499)[name = tensor("roti_7")]; tensor var_1503 = mul(x = var_1469, y = rotr_7)[name = tensor("op_1503")]; tensor var_1504 = mul(x = var_1477, y = roti_7)[name = tensor("op_1504")]; tensor qor_13 = sub(x = var_1503, y = var_1504)[name = tensor("qor_13")]; tensor var_1507 = mul(x = var_1469, y = roti_7)[name = tensor("op_1507")]; tensor var_1508 = mul(x = var_1477, y = rotr_7)[name = tensor("op_1508")]; tensor qoi_13 = add(x = var_1507, y = var_1508)[name = tensor("qoi_13")]; tensor var_1511 = mul(x = var_1485, y = rotr_7)[name = tensor("op_1511")]; tensor var_1512 = mul(x = var_1493, y = roti_7)[name = tensor("op_1512")]; tensor kor_13 = sub(x = var_1511, y = var_1512)[name = tensor("kor_13")]; tensor var_1515 = mul(x = var_1485, y = roti_7)[name = tensor("op_1515")]; tensor var_1516 = mul(x = var_1493, y = rotr_7)[name = tensor("op_1516")]; tensor koi_13 = add(x = var_1515, y = var_1516)[name = tensor("koi_13")]; tensor qo_7_axis_0 = const()[name = tensor("qo_7_axis_0"), val = tensor(-1)]; tensor qo_7 = stack(axis = qo_7_axis_0, values = (qor_13, qoi_13))[name = tensor("qo_7")]; tensor ko_7_axis_0 = const()[name = tensor("ko_7_axis_0"), val = tensor(-1)]; tensor ko_7 = stack(axis = ko_7_axis_0, values = (kor_13, koi_13))[name = tensor("ko_7")]; tensor var_1545 = const()[name = tensor("op_1545"), val = tensor([1, 1, 16, 64])]; tensor q_21 = reshape(shape = var_1545, x = qo_7)[name = tensor("q_21")]; tensor var_1547 = const()[name = tensor("op_1547"), val = tensor([1, 1, 16, 64])]; tensor k_15 = reshape(shape = var_1547, x = ko_7)[name = tensor("k_15")]; tensor _inversed_1569_y_0 = const()[name = tensor("_inversed_1569_y_0"), val = tensor(0x1p-9)]; tensor _inversed_1569 = mul(x = ts_23, y = _inversed_1569_y_0)[name = tensor("_inversed_1569")]; tensor var_1570 = floor(x = _inversed_1569)[name = tensor("op_1570")]; tensor var_1571 = const()[name = tensor("op_1571"), val = tensor(0x1p+9)]; tensor var_1572 = mul(x = var_1570, y = var_1571)[name = tensor("op_1572")]; tensor write_indices_float_15 = sub(x = ts_23, y = var_1572)[name = tensor("write_indices_float_15")]; tensor var_1579_dtype_0 = const()[name = tensor("op_1579_dtype_0"), val = tensor("int32")]; tensor write_indices_7_reps_0 = const()[name = tensor("write_indices_7_reps_0"), val = tensor([1, 1, 16, 64])]; tensor var_1579 = cast(dtype = var_1579_dtype_0, x = write_indices_float_15)[name = tensor("cast_110")]; tensor write_indices_7 = tile(reps = write_indices_7_reps_0, x = var_1579)[name = tensor("write_indices_7")]; tensor var_1587_begin_0 = const()[name = tensor("op_1587_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1587_end_0 = const()[name = tensor("op_1587_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor var_1587_end_mask_0 = const()[name = tensor("op_1587_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_1587_squeeze_mask_0 = const()[name = tensor("op_1587_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_1587 = slice_by_index(begin = var_1587_begin_0, end = var_1587_end_0, end_mask = var_1587_end_mask_0, squeeze_mask = var_1587_squeeze_mask_0, x = cache3)[name = tensor("op_1587")]; tensor var_1589_axis_0 = const()[name = tensor("op_1589_axis_0"), val = tensor(1)]; tensor var_1589_mode_0 = const()[name = tensor("op_1589_mode_0"), val = tensor("update")]; tensor var_1589_validate_indices_0 = const()[name = tensor("op_1589_validate_indices_0"), val = tensor(false)]; tensor var_1589 = scatter_along_axis(axis = var_1589_axis_0, data = var_1587, indices = write_indices_7, mode = var_1589_mode_0, updates = k_15, validate_indices = var_1589_validate_indices_0)[name = tensor("op_1589")]; tensor concat_23 = const()[name = tensor("concat_23"), val = tensor([0, 0, 0, 0, 0])]; tensor concat_24 = const()[name = tensor("concat_24"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_7_internal_tensor_assign_1_stride_0 = const()[name = tensor("new_cache_7_internal_tensor_assign_1_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_7_internal_tensor_assign_1_begin_mask_0 = const()[name = tensor("new_cache_7_internal_tensor_assign_1_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_7_internal_tensor_assign_1_end_mask_0 = const()[name = tensor("new_cache_7_internal_tensor_assign_1_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_7_internal_tensor_assign_1_squeeze_mask_0 = const()[name = tensor("new_cache_7_internal_tensor_assign_1_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_18 = const()[name = tensor("shape_18"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_6 = const()[name = tensor("reduce_prod_6"), val = tensor(1048576)]; tensor range_1d_6_start_0 = const()[name = tensor("range_1d_6_start_0"), val = tensor(0)]; tensor range_1d_6_step_0 = const()[name = tensor("range_1d_6_step_0"), val = tensor(1)]; tensor range_1d_6 = range_1d(end = reduce_prod_6, start = range_1d_6_start_0, step = range_1d_6_step_0)[name = tensor("range_1d_6")]; tensor reshape_30 = reshape(shape = shape_18, x = range_1d_6)[name = tensor("reshape_30")]; tensor slice_by_index_6 = slice_by_index(begin = concat_23, begin_mask = new_cache_7_internal_tensor_assign_1_begin_mask_0, end = concat_24, end_mask = new_cache_7_internal_tensor_assign_1_end_mask_0, squeeze_mask = new_cache_7_internal_tensor_assign_1_squeeze_mask_0, stride = new_cache_7_internal_tensor_assign_1_stride_0, x = reshape_30)[name = tensor("slice_by_index_6")]; tensor reshape_31_shape_0 = const()[name = tensor("reshape_31_shape_0"), val = tensor([-1])]; tensor reshape_31 = reshape(shape = reshape_31_shape_0, x = slice_by_index_6)[name = tensor("reshape_31")]; tensor reshape_32_shape_0 = const()[name = tensor("reshape_32_shape_0"), val = tensor([-1])]; tensor reshape_32 = reshape(shape = reshape_32_shape_0, x = var_1589)[name = tensor("reshape_32")]; tensor reshape_33_shape_0 = const()[name = tensor("reshape_33_shape_0"), val = tensor([-1])]; tensor reshape_33 = reshape(shape = reshape_33_shape_0, x = cache3)[name = tensor("reshape_33")]; tensor scatter_6_mode_0 = const()[name = tensor("scatter_6_mode_0"), val = tensor("update")]; tensor scatter_6_axis_0 = const()[name = tensor("scatter_6_axis_0"), val = tensor(0)]; tensor scatter_6_validate_indices_0 = const()[name = tensor("scatter_6_validate_indices_0"), val = tensor(false)]; tensor scatter_6 = scatter(axis = scatter_6_axis_0, data = reshape_33, indices = reshape_31, mode = scatter_6_mode_0, updates = reshape_32, validate_indices = scatter_6_validate_indices_0)[name = tensor("scatter_6")]; tensor reshape_34 = reshape(shape = shape_18, x = scatter_6)[name = tensor("reshape_34")]; tensor var_1597_begin_0 = const()[name = tensor("op_1597_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor var_1597_end_0 = const()[name = tensor("op_1597_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor var_1597_end_mask_0 = const()[name = tensor("op_1597_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_1597_squeeze_mask_0 = const()[name = tensor("op_1597_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_1597 = slice_by_index(begin = var_1597_begin_0, end = var_1597_end_0, end_mask = var_1597_end_mask_0, squeeze_mask = var_1597_squeeze_mask_0, x = reshape_34)[name = tensor("op_1597")]; tensor var_1599_axis_0 = const()[name = tensor("op_1599_axis_0"), val = tensor(1)]; tensor var_1599_mode_0 = const()[name = tensor("op_1599_mode_0"), val = tensor("update")]; tensor var_1599_validate_indices_0 = const()[name = tensor("op_1599_validate_indices_0"), val = tensor(false)]; tensor var_1599 = scatter_along_axis(axis = var_1599_axis_0, data = var_1597, indices = write_indices_7, mode = var_1599_mode_0, updates = v_7, validate_indices = var_1599_validate_indices_0)[name = tensor("op_1599")]; tensor concat_25 = const()[name = tensor("concat_25"), val = tensor([1, 0, 0, 0, 0])]; tensor concat_26 = const()[name = tensor("concat_26"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_7_internal_tensor_assign_2_stride_0 = const()[name = tensor("new_cache_7_internal_tensor_assign_2_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_7_internal_tensor_assign_2_begin_mask_0 = const()[name = tensor("new_cache_7_internal_tensor_assign_2_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_7_internal_tensor_assign_2_end_mask_0 = const()[name = tensor("new_cache_7_internal_tensor_assign_2_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_7_internal_tensor_assign_2_squeeze_mask_0 = const()[name = tensor("new_cache_7_internal_tensor_assign_2_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_19 = const()[name = tensor("shape_19"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_7 = const()[name = tensor("reduce_prod_7"), val = tensor(1048576)]; tensor range_1d_7_start_0 = const()[name = tensor("range_1d_7_start_0"), val = tensor(0)]; tensor range_1d_7_step_0 = const()[name = tensor("range_1d_7_step_0"), val = tensor(1)]; tensor range_1d_7 = range_1d(end = reduce_prod_7, start = range_1d_7_start_0, step = range_1d_7_step_0)[name = tensor("range_1d_7")]; tensor reshape_35 = reshape(shape = shape_19, x = range_1d_7)[name = tensor("reshape_35")]; tensor slice_by_index_7 = slice_by_index(begin = concat_25, begin_mask = new_cache_7_internal_tensor_assign_2_begin_mask_0, end = concat_26, end_mask = new_cache_7_internal_tensor_assign_2_end_mask_0, squeeze_mask = new_cache_7_internal_tensor_assign_2_squeeze_mask_0, stride = new_cache_7_internal_tensor_assign_2_stride_0, x = reshape_35)[name = tensor("slice_by_index_7")]; tensor reshape_36_shape_0 = const()[name = tensor("reshape_36_shape_0"), val = tensor([-1])]; tensor reshape_36 = reshape(shape = reshape_36_shape_0, x = slice_by_index_7)[name = tensor("reshape_36")]; tensor reshape_37_shape_0 = const()[name = tensor("reshape_37_shape_0"), val = tensor([-1])]; tensor reshape_37 = reshape(shape = reshape_37_shape_0, x = var_1599)[name = tensor("reshape_37")]; tensor reshape_38_shape_0 = const()[name = tensor("reshape_38_shape_0"), val = tensor([-1])]; tensor reshape_38 = reshape(shape = reshape_38_shape_0, x = reshape_34)[name = tensor("reshape_38")]; tensor scatter_7_mode_0 = const()[name = tensor("scatter_7_mode_0"), val = tensor("update")]; tensor scatter_7_axis_0 = const()[name = tensor("scatter_7_axis_0"), val = tensor(0)]; tensor scatter_7_validate_indices_0 = const()[name = tensor("scatter_7_validate_indices_0"), val = tensor(false)]; tensor scatter_7 = scatter(axis = scatter_7_axis_0, data = reshape_38, indices = reshape_36, mode = scatter_7_mode_0, updates = reshape_37, validate_indices = scatter_7_validate_indices_0)[name = tensor("scatter_7")]; tensor new_cache_7_internal_tensor_assign_2 = reshape(shape = shape_19, x = scatter_7)[name = tensor("reshape_39")]; tensor keys_19_begin_0 = const()[name = tensor("keys_19_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor keys_19_end_0 = const()[name = tensor("keys_19_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor keys_19_end_mask_0 = const()[name = tensor("keys_19_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor keys_19_squeeze_mask_0 = const()[name = tensor("keys_19_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor keys_19 = slice_by_index(begin = keys_19_begin_0, end = keys_19_end_0, end_mask = keys_19_end_mask_0, squeeze_mask = keys_19_squeeze_mask_0, x = new_cache_7_internal_tensor_assign_2)[name = tensor("keys_19")]; tensor values_19_begin_0 = const()[name = tensor("values_19_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor values_19_end_0 = const()[name = tensor("values_19_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor values_19_end_mask_0 = const()[name = tensor("values_19_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor values_19_squeeze_mask_0 = const()[name = tensor("values_19_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor values_19 = slice_by_index(begin = values_19_begin_0, end = values_19_end_0, end_mask = values_19_end_mask_0, squeeze_mask = values_19_squeeze_mask_0, x = new_cache_7_internal_tensor_assign_2)[name = tensor("values_19")]; tensor var_1611 = not_equal(x = keys_19, y = keys_19)[name = tensor("op_1611")]; tensor keys_21 = select(a = var_360, b = keys_19, cond = var_1611)[name = tensor("keys_21")]; tensor var_1619 = not_equal(x = values_19, y = values_19)[name = tensor("op_1619")]; tensor values_21 = select(a = var_360, b = values_19, cond = var_1619)[name = tensor("values_21")]; tensor var_1643 = const()[name = tensor("op_1643"), val = tensor([0, 2, 1, 3])]; tensor var_1656 = const()[name = tensor("op_1656"), val = tensor([1, 1, 1])]; tensor var_1657 = reshape(shape = var_1656, x = position3)[name = tensor("op_1657")]; tensor var_1674 = const()[name = tensor("op_1674"), val = tensor(0x1p+0)]; tensor valid_len_7 = add(x = var_1657, y = var_1674)[name = tensor("valid_len_7")]; tensor valid_mask_7 = less(x = k_positions_1_promoted, y = valid_len_7)[name = tensor("valid_mask_7")]; tensor causal_mask_7 = less_equal(x = k_positions_1_promoted, y = var_1657)[name = tensor("causal_mask_7")]; tensor attn_mask_13 = logical_and(x = valid_mask_7, y = causal_mask_7)[name = tensor("attn_mask_13")]; tensor attn_mask_15_axes_0 = const()[name = tensor("attn_mask_15_axes_0"), val = tensor([1])]; tensor attn_mask_15 = expand_dims(axes = attn_mask_15_axes_0, x = attn_mask_13)[name = tensor("attn_mask_15")]; tensor var_1686 = const()[name = tensor("op_1686"), val = tensor([0x1.fffe5cp-4])]; tensor var_1692_transpose_x_0 = const()[name = tensor("op_1692_transpose_x_0"), val = tensor(false)]; tensor var_1692_transpose_y_0 = const()[name = tensor("op_1692_transpose_y_0"), val = tensor(false)]; tensor transpose_24_perm_0 = const()[name = tensor("transpose_24_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_25_perm_0 = const()[name = tensor("transpose_25_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_25 = transpose(perm = transpose_25_perm_0, x = keys_21)[name = tensor("transpose_39")]; tensor transpose_24 = transpose(perm = transpose_24_perm_0, x = q_21)[name = tensor("transpose_40")]; tensor var_1692 = matmul(transpose_x = var_1692_transpose_x_0, transpose_y = var_1692_transpose_y_0, x = transpose_24, y = transpose_25)[name = tensor("op_1692")]; tensor attn_weights_19 = mul(x = var_1692, y = var_1686)[name = tensor("attn_weights_19")]; tensor var_1694 = logical_not(x = attn_mask_15)[name = tensor("op_1694")]; tensor var_1695 = const()[name = tensor("op_1695"), val = tensor(-0x1.ff933cp+127)]; tensor attn_weights_21 = select(a = var_1695, b = attn_weights_19, cond = var_1694)[name = tensor("attn_weights_21")]; tensor var_1697 = const()[name = tensor("op_1697"), val = tensor(-1)]; tensor attn_weights_23 = softmax(axis = var_1697, x = attn_weights_21)[name = tensor("attn_weights_23")]; tensor attn_output_7_transpose_x_0 = const()[name = tensor("attn_output_7_transpose_x_0"), val = tensor(false)]; tensor attn_output_7_transpose_y_0 = const()[name = tensor("attn_output_7_transpose_y_0"), val = tensor(false)]; tensor values_23 = transpose(perm = var_1643, x = values_21)[name = tensor("transpose_41")]; tensor attn_output_7 = matmul(transpose_x = attn_output_7_transpose_x_0, transpose_y = attn_output_7_transpose_y_0, x = attn_weights_23, y = values_23)[name = tensor("attn_output_7")]; tensor var_1705 = const()[name = tensor("op_1705"), val = tensor([0, 2, 1, 3])]; tensor var_1708 = const()[name = tensor("op_1708"), val = tensor([1, 1, 1024])]; tensor var_1706 = transpose(perm = var_1705, x = attn_output_7)[name = tensor("transpose_38")]; tensor input_35 = reshape(shape = var_1708, x = var_1706)[name = tensor("input_35")]; tensor attn_out_7 = linear(bias = linear_0_bias_0, weight = attn3_out_proj_weight, x = input_35)[name = tensor("linear_14")]; tensor var_1714 = const()[name = tensor("op_1714"), val = tensor(0x1p+0)]; tensor var_1715 = add(x = position3, y = var_1714)[name = tensor("op_1715")]; tensor input_37 = add(x = input_33, y = attn_out_7)[name = tensor("input_37")]; tensor var_1719 = const()[name = tensor("op_1719"), val = tensor(0x1.4f8b58p-17)]; tensor input_39_axes_0 = const()[name = tensor("input_39_axes_0"), val = tensor([-1])]; tensor input_39 = layer_norm(axes = input_39_axes_0, beta = norm3_2_bias, epsilon = var_1719, gamma = norm3_2_weight, x = input_37)[name = tensor("input_39")]; tensor var_1727 = linear(bias = linear_3_bias_0, weight = linear3_1_weight, x = input_39)[name = tensor("linear_15")]; tensor input_41_mode_0 = const()[name = tensor("input_41_mode_0"), val = tensor("EXACT")]; tensor input_41 = gelu(mode = input_41_mode_0, x = var_1727)[name = tensor("input_41")]; tensor ffn_out_7 = linear(bias = linear_0_bias_0, weight = linear3_2_weight, x = input_41)[name = tensor("linear_16")]; tensor input_43 = add(x = input_37, y = ffn_out_7)[name = tensor("input_43")]; tensor var_1736 = const()[name = tensor("op_1736"), val = tensor(0x1.4f8b58p-17)]; tensor x_9_axes_0 = const()[name = tensor("x_9_axes_0"), val = tensor([-1])]; tensor x_9 = layer_norm(axes = x_9_axes_0, beta = norm4_1_bias, epsilon = var_1736, gamma = norm4_1_weight, x = input_43)[name = tensor("x_9")]; tensor var_1768 = linear(bias = linear_1_bias_0, weight = attn4_in_proj_weight, x = x_9)[name = tensor("linear_17")]; tensor var_1772 = const()[name = tensor("op_1772"), val = tensor([1, 1, 3, 16, 64])]; tensor qkv_9 = reshape(shape = var_1772, x = var_1768)[name = tensor("qkv_9")]; tensor q_25_begin_0 = const()[name = tensor("q_25_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_25_end_0 = const()[name = tensor("q_25_end_0"), val = tensor([1, 1, 1, 16, 64])]; tensor q_25_end_mask_0 = const()[name = tensor("q_25_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_25_squeeze_mask_0 = const()[name = tensor("q_25_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_25 = slice_by_index(begin = q_25_begin_0, end = q_25_end_0, end_mask = q_25_end_mask_0, squeeze_mask = q_25_squeeze_mask_0, x = qkv_9)[name = tensor("q_25")]; tensor k_17_begin_0 = const()[name = tensor("k_17_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_17_end_0 = const()[name = tensor("k_17_end_0"), val = tensor([1, 1, 2, 16, 64])]; tensor k_17_end_mask_0 = const()[name = tensor("k_17_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_17_squeeze_mask_0 = const()[name = tensor("k_17_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_17 = slice_by_index(begin = k_17_begin_0, end = k_17_end_0, end_mask = k_17_end_mask_0, squeeze_mask = k_17_squeeze_mask_0, x = qkv_9)[name = tensor("k_17")]; tensor v_9_begin_0 = const()[name = tensor("v_9_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_9_end_0 = const()[name = tensor("v_9_end_0"), val = tensor([1, 1, 3, 16, 64])]; tensor v_9_end_mask_0 = const()[name = tensor("v_9_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_9_squeeze_mask_0 = const()[name = tensor("v_9_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v_9 = slice_by_index(begin = v_9_begin_0, end = v_9_end_0, end_mask = v_9_end_mask_0, squeeze_mask = v_9_squeeze_mask_0, x = qkv_9)[name = tensor("v_9")]; tensor freqs_9 = const()[name = tensor("freqs_9"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304368000)))]; tensor var_1876 = const()[name = tensor("op_1876"), val = tensor([1, 1, 1, 1])]; tensor ts_29 = reshape(shape = var_1876, x = position4)[name = tensor("ts_29")]; tensor var_1880 = const()[name = tensor("op_1880"), val = tensor([1, 1, 16, 32, 2])]; tensor q_complex_9 = reshape(shape = var_1880, x = q_25)[name = tensor("q_complex_9")]; tensor var_1884 = const()[name = tensor("op_1884"), val = tensor([1, 1, 16, 32, 2])]; tensor k_complex_9 = reshape(shape = var_1884, x = k_17)[name = tensor("k_complex_9")]; tensor var_1888_begin_0 = const()[name = tensor("op_1888_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1888_end_0 = const()[name = tensor("op_1888_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_1888_end_mask_0 = const()[name = tensor("op_1888_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1888_squeeze_mask_0 = const()[name = tensor("op_1888_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1888 = slice_by_index(begin = var_1888_begin_0, end = var_1888_end_0, end_mask = var_1888_end_mask_0, squeeze_mask = var_1888_squeeze_mask_0, x = q_complex_9)[name = tensor("op_1888")]; tensor var_1896_begin_0 = const()[name = tensor("op_1896_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_1896_end_0 = const()[name = tensor("op_1896_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_1896_end_mask_0 = const()[name = tensor("op_1896_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1896_squeeze_mask_0 = const()[name = tensor("op_1896_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1896 = slice_by_index(begin = var_1896_begin_0, end = var_1896_end_0, end_mask = var_1896_end_mask_0, squeeze_mask = var_1896_squeeze_mask_0, x = q_complex_9)[name = tensor("op_1896")]; tensor var_1904_begin_0 = const()[name = tensor("op_1904_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_1904_end_0 = const()[name = tensor("op_1904_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_1904_end_mask_0 = const()[name = tensor("op_1904_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1904_squeeze_mask_0 = const()[name = tensor("op_1904_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1904 = slice_by_index(begin = var_1904_begin_0, end = var_1904_end_0, end_mask = var_1904_end_mask_0, squeeze_mask = var_1904_squeeze_mask_0, x = k_complex_9)[name = tensor("op_1904")]; tensor var_1912_begin_0 = const()[name = tensor("op_1912_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_1912_end_0 = const()[name = tensor("op_1912_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_1912_end_mask_0 = const()[name = tensor("op_1912_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_1912_squeeze_mask_0 = const()[name = tensor("op_1912_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_1912 = slice_by_index(begin = var_1912_begin_0, end = var_1912_end_0, end_mask = var_1912_end_mask_0, squeeze_mask = var_1912_squeeze_mask_0, x = k_complex_9)[name = tensor("op_1912")]; tensor var_1918 = mul(x = freqs_9, y = ts_29)[name = tensor("op_1918")]; tensor rotr_9 = cos(x = var_1918)[name = tensor("rotr_9")]; tensor roti_9 = sin(x = var_1918)[name = tensor("roti_9")]; tensor var_1922 = mul(x = var_1888, y = rotr_9)[name = tensor("op_1922")]; tensor var_1923 = mul(x = var_1896, y = roti_9)[name = tensor("op_1923")]; tensor qor_17 = sub(x = var_1922, y = var_1923)[name = tensor("qor_17")]; tensor var_1926 = mul(x = var_1888, y = roti_9)[name = tensor("op_1926")]; tensor var_1927 = mul(x = var_1896, y = rotr_9)[name = tensor("op_1927")]; tensor qoi_17 = add(x = var_1926, y = var_1927)[name = tensor("qoi_17")]; tensor var_1930 = mul(x = var_1904, y = rotr_9)[name = tensor("op_1930")]; tensor var_1931 = mul(x = var_1912, y = roti_9)[name = tensor("op_1931")]; tensor kor_17 = sub(x = var_1930, y = var_1931)[name = tensor("kor_17")]; tensor var_1934 = mul(x = var_1904, y = roti_9)[name = tensor("op_1934")]; tensor var_1935 = mul(x = var_1912, y = rotr_9)[name = tensor("op_1935")]; tensor koi_17 = add(x = var_1934, y = var_1935)[name = tensor("koi_17")]; tensor qo_9_axis_0 = const()[name = tensor("qo_9_axis_0"), val = tensor(-1)]; tensor qo_9 = stack(axis = qo_9_axis_0, values = (qor_17, qoi_17))[name = tensor("qo_9")]; tensor ko_9_axis_0 = const()[name = tensor("ko_9_axis_0"), val = tensor(-1)]; tensor ko_9 = stack(axis = ko_9_axis_0, values = (kor_17, koi_17))[name = tensor("ko_9")]; tensor var_1964 = const()[name = tensor("op_1964"), val = tensor([1, 1, 16, 64])]; tensor q_27 = reshape(shape = var_1964, x = qo_9)[name = tensor("q_27")]; tensor var_1966 = const()[name = tensor("op_1966"), val = tensor([1, 1, 16, 64])]; tensor k_19 = reshape(shape = var_1966, x = ko_9)[name = tensor("k_19")]; tensor _inversed_1988_y_0 = const()[name = tensor("_inversed_1988_y_0"), val = tensor(0x1p-9)]; tensor _inversed_1988 = mul(x = ts_29, y = _inversed_1988_y_0)[name = tensor("_inversed_1988")]; tensor var_1989 = floor(x = _inversed_1988)[name = tensor("op_1989")]; tensor var_1990 = const()[name = tensor("op_1990"), val = tensor(0x1p+9)]; tensor var_1991 = mul(x = var_1989, y = var_1990)[name = tensor("op_1991")]; tensor write_indices_float_19 = sub(x = ts_29, y = var_1991)[name = tensor("write_indices_float_19")]; tensor var_1998_dtype_0 = const()[name = tensor("op_1998_dtype_0"), val = tensor("int32")]; tensor write_indices_9_reps_0 = const()[name = tensor("write_indices_9_reps_0"), val = tensor([1, 1, 16, 64])]; tensor var_1998 = cast(dtype = var_1998_dtype_0, x = write_indices_float_19)[name = tensor("cast_109")]; tensor write_indices_9 = tile(reps = write_indices_9_reps_0, x = var_1998)[name = tensor("write_indices_9")]; tensor var_2006_begin_0 = const()[name = tensor("op_2006_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_2006_end_0 = const()[name = tensor("op_2006_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor var_2006_end_mask_0 = const()[name = tensor("op_2006_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_2006_squeeze_mask_0 = const()[name = tensor("op_2006_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_2006 = slice_by_index(begin = var_2006_begin_0, end = var_2006_end_0, end_mask = var_2006_end_mask_0, squeeze_mask = var_2006_squeeze_mask_0, x = cache4)[name = tensor("op_2006")]; tensor var_2008_axis_0 = const()[name = tensor("op_2008_axis_0"), val = tensor(1)]; tensor var_2008_mode_0 = const()[name = tensor("op_2008_mode_0"), val = tensor("update")]; tensor var_2008_validate_indices_0 = const()[name = tensor("op_2008_validate_indices_0"), val = tensor(false)]; tensor var_2008 = scatter_along_axis(axis = var_2008_axis_0, data = var_2006, indices = write_indices_9, mode = var_2008_mode_0, updates = k_19, validate_indices = var_2008_validate_indices_0)[name = tensor("op_2008")]; tensor concat_30 = const()[name = tensor("concat_30"), val = tensor([0, 0, 0, 0, 0])]; tensor concat_31 = const()[name = tensor("concat_31"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_9_internal_tensor_assign_1_stride_0 = const()[name = tensor("new_cache_9_internal_tensor_assign_1_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_9_internal_tensor_assign_1_begin_mask_0 = const()[name = tensor("new_cache_9_internal_tensor_assign_1_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_9_internal_tensor_assign_1_end_mask_0 = const()[name = tensor("new_cache_9_internal_tensor_assign_1_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_9_internal_tensor_assign_1_squeeze_mask_0 = const()[name = tensor("new_cache_9_internal_tensor_assign_1_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_20 = const()[name = tensor("shape_20"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_8 = const()[name = tensor("reduce_prod_8"), val = tensor(1048576)]; tensor range_1d_8_start_0 = const()[name = tensor("range_1d_8_start_0"), val = tensor(0)]; tensor range_1d_8_step_0 = const()[name = tensor("range_1d_8_step_0"), val = tensor(1)]; tensor range_1d_8 = range_1d(end = reduce_prod_8, start = range_1d_8_start_0, step = range_1d_8_step_0)[name = tensor("range_1d_8")]; tensor reshape_40 = reshape(shape = shape_20, x = range_1d_8)[name = tensor("reshape_40")]; tensor slice_by_index_8 = slice_by_index(begin = concat_30, begin_mask = new_cache_9_internal_tensor_assign_1_begin_mask_0, end = concat_31, end_mask = new_cache_9_internal_tensor_assign_1_end_mask_0, squeeze_mask = new_cache_9_internal_tensor_assign_1_squeeze_mask_0, stride = new_cache_9_internal_tensor_assign_1_stride_0, x = reshape_40)[name = tensor("slice_by_index_8")]; tensor reshape_41_shape_0 = const()[name = tensor("reshape_41_shape_0"), val = tensor([-1])]; tensor reshape_41 = reshape(shape = reshape_41_shape_0, x = slice_by_index_8)[name = tensor("reshape_41")]; tensor reshape_42_shape_0 = const()[name = tensor("reshape_42_shape_0"), val = tensor([-1])]; tensor reshape_42 = reshape(shape = reshape_42_shape_0, x = var_2008)[name = tensor("reshape_42")]; tensor reshape_43_shape_0 = const()[name = tensor("reshape_43_shape_0"), val = tensor([-1])]; tensor reshape_43 = reshape(shape = reshape_43_shape_0, x = cache4)[name = tensor("reshape_43")]; tensor scatter_8_mode_0 = const()[name = tensor("scatter_8_mode_0"), val = tensor("update")]; tensor scatter_8_axis_0 = const()[name = tensor("scatter_8_axis_0"), val = tensor(0)]; tensor scatter_8_validate_indices_0 = const()[name = tensor("scatter_8_validate_indices_0"), val = tensor(false)]; tensor scatter_8 = scatter(axis = scatter_8_axis_0, data = reshape_43, indices = reshape_41, mode = scatter_8_mode_0, updates = reshape_42, validate_indices = scatter_8_validate_indices_0)[name = tensor("scatter_8")]; tensor reshape_44 = reshape(shape = shape_20, x = scatter_8)[name = tensor("reshape_44")]; tensor var_2016_begin_0 = const()[name = tensor("op_2016_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor var_2016_end_0 = const()[name = tensor("op_2016_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor var_2016_end_mask_0 = const()[name = tensor("op_2016_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_2016_squeeze_mask_0 = const()[name = tensor("op_2016_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_2016 = slice_by_index(begin = var_2016_begin_0, end = var_2016_end_0, end_mask = var_2016_end_mask_0, squeeze_mask = var_2016_squeeze_mask_0, x = reshape_44)[name = tensor("op_2016")]; tensor var_2018_axis_0 = const()[name = tensor("op_2018_axis_0"), val = tensor(1)]; tensor var_2018_mode_0 = const()[name = tensor("op_2018_mode_0"), val = tensor("update")]; tensor var_2018_validate_indices_0 = const()[name = tensor("op_2018_validate_indices_0"), val = tensor(false)]; tensor var_2018 = scatter_along_axis(axis = var_2018_axis_0, data = var_2016, indices = write_indices_9, mode = var_2018_mode_0, updates = v_9, validate_indices = var_2018_validate_indices_0)[name = tensor("op_2018")]; tensor concat_32 = const()[name = tensor("concat_32"), val = tensor([1, 0, 0, 0, 0])]; tensor concat_33 = const()[name = tensor("concat_33"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_9_internal_tensor_assign_2_stride_0 = const()[name = tensor("new_cache_9_internal_tensor_assign_2_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_9_internal_tensor_assign_2_begin_mask_0 = const()[name = tensor("new_cache_9_internal_tensor_assign_2_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_9_internal_tensor_assign_2_end_mask_0 = const()[name = tensor("new_cache_9_internal_tensor_assign_2_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_9_internal_tensor_assign_2_squeeze_mask_0 = const()[name = tensor("new_cache_9_internal_tensor_assign_2_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_21 = const()[name = tensor("shape_21"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_9 = const()[name = tensor("reduce_prod_9"), val = tensor(1048576)]; tensor range_1d_9_start_0 = const()[name = tensor("range_1d_9_start_0"), val = tensor(0)]; tensor range_1d_9_step_0 = const()[name = tensor("range_1d_9_step_0"), val = tensor(1)]; tensor range_1d_9 = range_1d(end = reduce_prod_9, start = range_1d_9_start_0, step = range_1d_9_step_0)[name = tensor("range_1d_9")]; tensor reshape_45 = reshape(shape = shape_21, x = range_1d_9)[name = tensor("reshape_45")]; tensor slice_by_index_9 = slice_by_index(begin = concat_32, begin_mask = new_cache_9_internal_tensor_assign_2_begin_mask_0, end = concat_33, end_mask = new_cache_9_internal_tensor_assign_2_end_mask_0, squeeze_mask = new_cache_9_internal_tensor_assign_2_squeeze_mask_0, stride = new_cache_9_internal_tensor_assign_2_stride_0, x = reshape_45)[name = tensor("slice_by_index_9")]; tensor reshape_46_shape_0 = const()[name = tensor("reshape_46_shape_0"), val = tensor([-1])]; tensor reshape_46 = reshape(shape = reshape_46_shape_0, x = slice_by_index_9)[name = tensor("reshape_46")]; tensor reshape_47_shape_0 = const()[name = tensor("reshape_47_shape_0"), val = tensor([-1])]; tensor reshape_47 = reshape(shape = reshape_47_shape_0, x = var_2018)[name = tensor("reshape_47")]; tensor reshape_48_shape_0 = const()[name = tensor("reshape_48_shape_0"), val = tensor([-1])]; tensor reshape_48 = reshape(shape = reshape_48_shape_0, x = reshape_44)[name = tensor("reshape_48")]; tensor scatter_9_mode_0 = const()[name = tensor("scatter_9_mode_0"), val = tensor("update")]; tensor scatter_9_axis_0 = const()[name = tensor("scatter_9_axis_0"), val = tensor(0)]; tensor scatter_9_validate_indices_0 = const()[name = tensor("scatter_9_validate_indices_0"), val = tensor(false)]; tensor scatter_9 = scatter(axis = scatter_9_axis_0, data = reshape_48, indices = reshape_46, mode = scatter_9_mode_0, updates = reshape_47, validate_indices = scatter_9_validate_indices_0)[name = tensor("scatter_9")]; tensor new_cache_9_internal_tensor_assign_2 = reshape(shape = shape_21, x = scatter_9)[name = tensor("reshape_49")]; tensor keys_25_begin_0 = const()[name = tensor("keys_25_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor keys_25_end_0 = const()[name = tensor("keys_25_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor keys_25_end_mask_0 = const()[name = tensor("keys_25_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor keys_25_squeeze_mask_0 = const()[name = tensor("keys_25_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor keys_25 = slice_by_index(begin = keys_25_begin_0, end = keys_25_end_0, end_mask = keys_25_end_mask_0, squeeze_mask = keys_25_squeeze_mask_0, x = new_cache_9_internal_tensor_assign_2)[name = tensor("keys_25")]; tensor values_25_begin_0 = const()[name = tensor("values_25_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor values_25_end_0 = const()[name = tensor("values_25_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor values_25_end_mask_0 = const()[name = tensor("values_25_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor values_25_squeeze_mask_0 = const()[name = tensor("values_25_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor values_25 = slice_by_index(begin = values_25_begin_0, end = values_25_end_0, end_mask = values_25_end_mask_0, squeeze_mask = values_25_squeeze_mask_0, x = new_cache_9_internal_tensor_assign_2)[name = tensor("values_25")]; tensor var_2030 = not_equal(x = keys_25, y = keys_25)[name = tensor("op_2030")]; tensor keys_27 = select(a = var_360, b = keys_25, cond = var_2030)[name = tensor("keys_27")]; tensor var_2038 = not_equal(x = values_25, y = values_25)[name = tensor("op_2038")]; tensor values_27 = select(a = var_360, b = values_25, cond = var_2038)[name = tensor("values_27")]; tensor var_2062 = const()[name = tensor("op_2062"), val = tensor([0, 2, 1, 3])]; tensor var_2075 = const()[name = tensor("op_2075"), val = tensor([1, 1, 1])]; tensor var_2076 = reshape(shape = var_2075, x = position4)[name = tensor("op_2076")]; tensor var_2093 = const()[name = tensor("op_2093"), val = tensor(0x1p+0)]; tensor valid_len_9 = add(x = var_2076, y = var_2093)[name = tensor("valid_len_9")]; tensor valid_mask_9 = less(x = k_positions_1_promoted, y = valid_len_9)[name = tensor("valid_mask_9")]; tensor causal_mask_9 = less_equal(x = k_positions_1_promoted, y = var_2076)[name = tensor("causal_mask_9")]; tensor attn_mask_17 = logical_and(x = valid_mask_9, y = causal_mask_9)[name = tensor("attn_mask_17")]; tensor attn_mask_19_axes_0 = const()[name = tensor("attn_mask_19_axes_0"), val = tensor([1])]; tensor attn_mask_19 = expand_dims(axes = attn_mask_19_axes_0, x = attn_mask_17)[name = tensor("attn_mask_19")]; tensor var_2105 = const()[name = tensor("op_2105"), val = tensor([0x1.fffe5cp-4])]; tensor var_2111_transpose_x_0 = const()[name = tensor("op_2111_transpose_x_0"), val = tensor(false)]; tensor var_2111_transpose_y_0 = const()[name = tensor("op_2111_transpose_y_0"), val = tensor(false)]; tensor transpose_26_perm_0 = const()[name = tensor("transpose_26_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_27_perm_0 = const()[name = tensor("transpose_27_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_27 = transpose(perm = transpose_27_perm_0, x = keys_27)[name = tensor("transpose_35")]; tensor transpose_26 = transpose(perm = transpose_26_perm_0, x = q_27)[name = tensor("transpose_36")]; tensor var_2111 = matmul(transpose_x = var_2111_transpose_x_0, transpose_y = var_2111_transpose_y_0, x = transpose_26, y = transpose_27)[name = tensor("op_2111")]; tensor attn_weights_25 = mul(x = var_2111, y = var_2105)[name = tensor("attn_weights_25")]; tensor var_2113 = logical_not(x = attn_mask_19)[name = tensor("op_2113")]; tensor var_2114 = const()[name = tensor("op_2114"), val = tensor(-0x1.ff933cp+127)]; tensor attn_weights_27 = select(a = var_2114, b = attn_weights_25, cond = var_2113)[name = tensor("attn_weights_27")]; tensor var_2116 = const()[name = tensor("op_2116"), val = tensor(-1)]; tensor attn_weights_29 = softmax(axis = var_2116, x = attn_weights_27)[name = tensor("attn_weights_29")]; tensor attn_output_9_transpose_x_0 = const()[name = tensor("attn_output_9_transpose_x_0"), val = tensor(false)]; tensor attn_output_9_transpose_y_0 = const()[name = tensor("attn_output_9_transpose_y_0"), val = tensor(false)]; tensor values_29 = transpose(perm = var_2062, x = values_27)[name = tensor("transpose_37")]; tensor attn_output_9 = matmul(transpose_x = attn_output_9_transpose_x_0, transpose_y = attn_output_9_transpose_y_0, x = attn_weights_29, y = values_29)[name = tensor("attn_output_9")]; tensor var_2124 = const()[name = tensor("op_2124"), val = tensor([0, 2, 1, 3])]; tensor var_2127 = const()[name = tensor("op_2127"), val = tensor([1, 1, 1024])]; tensor var_2125 = transpose(perm = var_2124, x = attn_output_9)[name = tensor("transpose_34")]; tensor input_45 = reshape(shape = var_2127, x = var_2125)[name = tensor("input_45")]; tensor attn_out_9 = linear(bias = linear_0_bias_0, weight = attn4_out_proj_weight, x = input_45)[name = tensor("linear_18")]; tensor var_2133 = const()[name = tensor("op_2133"), val = tensor(0x1p+0)]; tensor var_2134 = add(x = position4, y = var_2133)[name = tensor("op_2134")]; tensor input_47 = add(x = input_43, y = attn_out_9)[name = tensor("input_47")]; tensor var_2138 = const()[name = tensor("op_2138"), val = tensor(0x1.4f8b58p-17)]; tensor input_49_axes_0 = const()[name = tensor("input_49_axes_0"), val = tensor([-1])]; tensor input_49 = layer_norm(axes = input_49_axes_0, beta = norm4_2_bias, epsilon = var_2138, gamma = norm4_2_weight, x = input_47)[name = tensor("input_49")]; tensor var_2146 = linear(bias = linear_3_bias_0, weight = linear4_1_weight, x = input_49)[name = tensor("linear_19")]; tensor input_51_mode_0 = const()[name = tensor("input_51_mode_0"), val = tensor("EXACT")]; tensor input_51 = gelu(mode = input_51_mode_0, x = var_2146)[name = tensor("input_51")]; tensor ffn_out_9 = linear(bias = linear_0_bias_0, weight = linear4_2_weight, x = input_51)[name = tensor("linear_20")]; tensor input_53 = add(x = input_47, y = ffn_out_9)[name = tensor("input_53")]; tensor var_2155 = const()[name = tensor("op_2155"), val = tensor(0x1.4f8b58p-17)]; tensor x_axes_0 = const()[name = tensor("x_axes_0"), val = tensor([-1])]; tensor x = layer_norm(axes = x_axes_0, beta = norm5_1_bias, epsilon = var_2155, gamma = norm5_1_weight, x = input_53)[name = tensor("x")]; tensor var_2187 = linear(bias = linear_1_bias_0, weight = attn5_in_proj_weight, x = x)[name = tensor("linear_21")]; tensor var_2191 = const()[name = tensor("op_2191"), val = tensor([1, 1, 3, 16, 64])]; tensor qkv = reshape(shape = var_2191, x = var_2187)[name = tensor("qkv")]; tensor q_31_begin_0 = const()[name = tensor("q_31_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor q_31_end_0 = const()[name = tensor("q_31_end_0"), val = tensor([1, 1, 1, 16, 64])]; tensor q_31_end_mask_0 = const()[name = tensor("q_31_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor q_31_squeeze_mask_0 = const()[name = tensor("q_31_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor q_31 = slice_by_index(begin = q_31_begin_0, end = q_31_end_0, end_mask = q_31_end_mask_0, squeeze_mask = q_31_squeeze_mask_0, x = qkv)[name = tensor("q_31")]; tensor k_21_begin_0 = const()[name = tensor("k_21_begin_0"), val = tensor([0, 0, 1, 0, 0])]; tensor k_21_end_0 = const()[name = tensor("k_21_end_0"), val = tensor([1, 1, 2, 16, 64])]; tensor k_21_end_mask_0 = const()[name = tensor("k_21_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor k_21_squeeze_mask_0 = const()[name = tensor("k_21_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor k_21 = slice_by_index(begin = k_21_begin_0, end = k_21_end_0, end_mask = k_21_end_mask_0, squeeze_mask = k_21_squeeze_mask_0, x = qkv)[name = tensor("k_21")]; tensor v_begin_0 = const()[name = tensor("v_begin_0"), val = tensor([0, 0, 2, 0, 0])]; tensor v_end_0 = const()[name = tensor("v_end_0"), val = tensor([1, 1, 3, 16, 64])]; tensor v_end_mask_0 = const()[name = tensor("v_end_mask_0"), val = tensor([true, true, false, true, true])]; tensor v_squeeze_mask_0 = const()[name = tensor("v_squeeze_mask_0"), val = tensor([false, false, true, false, false])]; tensor v = slice_by_index(begin = v_begin_0, end = v_end_0, end_mask = v_end_mask_0, squeeze_mask = v_squeeze_mask_0, x = qkv)[name = tensor("v")]; tensor freqs = const()[name = tensor("freqs"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(304368192)))]; tensor var_2295 = const()[name = tensor("op_2295"), val = tensor([1, 1, 1, 1])]; tensor ts = reshape(shape = var_2295, x = position5)[name = tensor("ts")]; tensor var_2299 = const()[name = tensor("op_2299"), val = tensor([1, 1, 16, 32, 2])]; tensor q_complex = reshape(shape = var_2299, x = q_31)[name = tensor("q_complex")]; tensor var_2303 = const()[name = tensor("op_2303"), val = tensor([1, 1, 16, 32, 2])]; tensor k_complex = reshape(shape = var_2303, x = k_21)[name = tensor("k_complex")]; tensor var_2307_begin_0 = const()[name = tensor("op_2307_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_2307_end_0 = const()[name = tensor("op_2307_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_2307_end_mask_0 = const()[name = tensor("op_2307_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_2307_squeeze_mask_0 = const()[name = tensor("op_2307_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_2307 = slice_by_index(begin = var_2307_begin_0, end = var_2307_end_0, end_mask = var_2307_end_mask_0, squeeze_mask = var_2307_squeeze_mask_0, x = q_complex)[name = tensor("op_2307")]; tensor var_2315_begin_0 = const()[name = tensor("op_2315_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_2315_end_0 = const()[name = tensor("op_2315_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_2315_end_mask_0 = const()[name = tensor("op_2315_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_2315_squeeze_mask_0 = const()[name = tensor("op_2315_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_2315 = slice_by_index(begin = var_2315_begin_0, end = var_2315_end_0, end_mask = var_2315_end_mask_0, squeeze_mask = var_2315_squeeze_mask_0, x = q_complex)[name = tensor("op_2315")]; tensor var_2323_begin_0 = const()[name = tensor("op_2323_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_2323_end_0 = const()[name = tensor("op_2323_end_0"), val = tensor([1, 1, 16, 32, 1])]; tensor var_2323_end_mask_0 = const()[name = tensor("op_2323_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_2323_squeeze_mask_0 = const()[name = tensor("op_2323_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_2323 = slice_by_index(begin = var_2323_begin_0, end = var_2323_end_0, end_mask = var_2323_end_mask_0, squeeze_mask = var_2323_squeeze_mask_0, x = k_complex)[name = tensor("op_2323")]; tensor var_2331_begin_0 = const()[name = tensor("op_2331_begin_0"), val = tensor([0, 0, 0, 0, 1])]; tensor var_2331_end_0 = const()[name = tensor("op_2331_end_0"), val = tensor([1, 1, 16, 32, 2])]; tensor var_2331_end_mask_0 = const()[name = tensor("op_2331_end_mask_0"), val = tensor([true, true, true, true, false])]; tensor var_2331_squeeze_mask_0 = const()[name = tensor("op_2331_squeeze_mask_0"), val = tensor([false, false, false, false, true])]; tensor var_2331 = slice_by_index(begin = var_2331_begin_0, end = var_2331_end_0, end_mask = var_2331_end_mask_0, squeeze_mask = var_2331_squeeze_mask_0, x = k_complex)[name = tensor("op_2331")]; tensor var_2337 = mul(x = freqs, y = ts)[name = tensor("op_2337")]; tensor rotr = cos(x = var_2337)[name = tensor("rotr")]; tensor roti = sin(x = var_2337)[name = tensor("roti")]; tensor var_2341 = mul(x = var_2307, y = rotr)[name = tensor("op_2341")]; tensor var_2342 = mul(x = var_2315, y = roti)[name = tensor("op_2342")]; tensor qor_21 = sub(x = var_2341, y = var_2342)[name = tensor("qor_21")]; tensor var_2345 = mul(x = var_2307, y = roti)[name = tensor("op_2345")]; tensor var_2346 = mul(x = var_2315, y = rotr)[name = tensor("op_2346")]; tensor qoi_21 = add(x = var_2345, y = var_2346)[name = tensor("qoi_21")]; tensor var_2349 = mul(x = var_2323, y = rotr)[name = tensor("op_2349")]; tensor var_2350 = mul(x = var_2331, y = roti)[name = tensor("op_2350")]; tensor kor_21 = sub(x = var_2349, y = var_2350)[name = tensor("kor_21")]; tensor var_2353 = mul(x = var_2323, y = roti)[name = tensor("op_2353")]; tensor var_2354 = mul(x = var_2331, y = rotr)[name = tensor("op_2354")]; tensor koi_21 = add(x = var_2353, y = var_2354)[name = tensor("koi_21")]; tensor qo_axis_0 = const()[name = tensor("qo_axis_0"), val = tensor(-1)]; tensor qo = stack(axis = qo_axis_0, values = (qor_21, qoi_21))[name = tensor("qo")]; tensor ko_axis_0 = const()[name = tensor("ko_axis_0"), val = tensor(-1)]; tensor ko = stack(axis = ko_axis_0, values = (kor_21, koi_21))[name = tensor("ko")]; tensor var_2383 = const()[name = tensor("op_2383"), val = tensor([1, 1, 16, 64])]; tensor q_33 = reshape(shape = var_2383, x = qo)[name = tensor("q_33")]; tensor var_2385 = const()[name = tensor("op_2385"), val = tensor([1, 1, 16, 64])]; tensor k = reshape(shape = var_2385, x = ko)[name = tensor("k")]; tensor _inversed_2407_y_0 = const()[name = tensor("_inversed_2407_y_0"), val = tensor(0x1p-9)]; tensor _inversed_2407 = mul(x = ts, y = _inversed_2407_y_0)[name = tensor("_inversed_2407")]; tensor var_2408 = floor(x = _inversed_2407)[name = tensor("op_2408")]; tensor var_2409 = const()[name = tensor("op_2409"), val = tensor(0x1p+9)]; tensor var_2410 = mul(x = var_2408, y = var_2409)[name = tensor("op_2410")]; tensor write_indices_float = sub(x = ts, y = var_2410)[name = tensor("write_indices_float")]; tensor var_2417_dtype_0 = const()[name = tensor("op_2417_dtype_0"), val = tensor("int32")]; tensor write_indices_reps_0 = const()[name = tensor("write_indices_reps_0"), val = tensor([1, 1, 16, 64])]; tensor var_2417 = cast(dtype = var_2417_dtype_0, x = write_indices_float)[name = tensor("cast_108")]; tensor write_indices = tile(reps = write_indices_reps_0, x = var_2417)[name = tensor("write_indices")]; tensor var_2425_begin_0 = const()[name = tensor("op_2425_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor var_2425_end_0 = const()[name = tensor("op_2425_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor var_2425_end_mask_0 = const()[name = tensor("op_2425_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_2425_squeeze_mask_0 = const()[name = tensor("op_2425_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_2425 = slice_by_index(begin = var_2425_begin_0, end = var_2425_end_0, end_mask = var_2425_end_mask_0, squeeze_mask = var_2425_squeeze_mask_0, x = cache5)[name = tensor("op_2425")]; tensor var_2427_axis_0 = const()[name = tensor("op_2427_axis_0"), val = tensor(1)]; tensor var_2427_mode_0 = const()[name = tensor("op_2427_mode_0"), val = tensor("update")]; tensor var_2427_validate_indices_0 = const()[name = tensor("op_2427_validate_indices_0"), val = tensor(false)]; tensor var_2427 = scatter_along_axis(axis = var_2427_axis_0, data = var_2425, indices = write_indices, mode = var_2427_mode_0, updates = k, validate_indices = var_2427_validate_indices_0)[name = tensor("op_2427")]; tensor concat_37 = const()[name = tensor("concat_37"), val = tensor([0, 0, 0, 0, 0])]; tensor concat_38 = const()[name = tensor("concat_38"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_internal_tensor_assign_1_stride_0 = const()[name = tensor("new_cache_internal_tensor_assign_1_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_internal_tensor_assign_1_begin_mask_0 = const()[name = tensor("new_cache_internal_tensor_assign_1_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_internal_tensor_assign_1_end_mask_0 = const()[name = tensor("new_cache_internal_tensor_assign_1_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_internal_tensor_assign_1_squeeze_mask_0 = const()[name = tensor("new_cache_internal_tensor_assign_1_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_22 = const()[name = tensor("shape_22"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_10 = const()[name = tensor("reduce_prod_10"), val = tensor(1048576)]; tensor range_1d_10_start_0 = const()[name = tensor("range_1d_10_start_0"), val = tensor(0)]; tensor range_1d_10_step_0 = const()[name = tensor("range_1d_10_step_0"), val = tensor(1)]; tensor range_1d_10 = range_1d(end = reduce_prod_10, start = range_1d_10_start_0, step = range_1d_10_step_0)[name = tensor("range_1d_10")]; tensor reshape_50 = reshape(shape = shape_22, x = range_1d_10)[name = tensor("reshape_50")]; tensor slice_by_index_10 = slice_by_index(begin = concat_37, begin_mask = new_cache_internal_tensor_assign_1_begin_mask_0, end = concat_38, end_mask = new_cache_internal_tensor_assign_1_end_mask_0, squeeze_mask = new_cache_internal_tensor_assign_1_squeeze_mask_0, stride = new_cache_internal_tensor_assign_1_stride_0, x = reshape_50)[name = tensor("slice_by_index_10")]; tensor reshape_51_shape_0 = const()[name = tensor("reshape_51_shape_0"), val = tensor([-1])]; tensor reshape_51 = reshape(shape = reshape_51_shape_0, x = slice_by_index_10)[name = tensor("reshape_51")]; tensor reshape_52_shape_0 = const()[name = tensor("reshape_52_shape_0"), val = tensor([-1])]; tensor reshape_52 = reshape(shape = reshape_52_shape_0, x = var_2427)[name = tensor("reshape_52")]; tensor reshape_53_shape_0 = const()[name = tensor("reshape_53_shape_0"), val = tensor([-1])]; tensor reshape_53 = reshape(shape = reshape_53_shape_0, x = cache5)[name = tensor("reshape_53")]; tensor scatter_10_mode_0 = const()[name = tensor("scatter_10_mode_0"), val = tensor("update")]; tensor scatter_10_axis_0 = const()[name = tensor("scatter_10_axis_0"), val = tensor(0)]; tensor scatter_10_validate_indices_0 = const()[name = tensor("scatter_10_validate_indices_0"), val = tensor(false)]; tensor scatter_10 = scatter(axis = scatter_10_axis_0, data = reshape_53, indices = reshape_51, mode = scatter_10_mode_0, updates = reshape_52, validate_indices = scatter_10_validate_indices_0)[name = tensor("scatter_10")]; tensor reshape_54 = reshape(shape = shape_22, x = scatter_10)[name = tensor("reshape_54")]; tensor var_2435_begin_0 = const()[name = tensor("op_2435_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor var_2435_end_0 = const()[name = tensor("op_2435_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor var_2435_end_mask_0 = const()[name = tensor("op_2435_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor var_2435_squeeze_mask_0 = const()[name = tensor("op_2435_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor var_2435 = slice_by_index(begin = var_2435_begin_0, end = var_2435_end_0, end_mask = var_2435_end_mask_0, squeeze_mask = var_2435_squeeze_mask_0, x = reshape_54)[name = tensor("op_2435")]; tensor var_2437_axis_0 = const()[name = tensor("op_2437_axis_0"), val = tensor(1)]; tensor var_2437_mode_0 = const()[name = tensor("op_2437_mode_0"), val = tensor("update")]; tensor var_2437_validate_indices_0 = const()[name = tensor("op_2437_validate_indices_0"), val = tensor(false)]; tensor var_2437 = scatter_along_axis(axis = var_2437_axis_0, data = var_2435, indices = write_indices, mode = var_2437_mode_0, updates = v, validate_indices = var_2437_validate_indices_0)[name = tensor("op_2437")]; tensor concat_39 = const()[name = tensor("concat_39"), val = tensor([1, 0, 0, 0, 0])]; tensor concat_40 = const()[name = tensor("concat_40"), val = tensor([0, 0, 0, 0, 0])]; tensor new_cache_internal_tensor_assign_2_stride_0 = const()[name = tensor("new_cache_internal_tensor_assign_2_stride_0"), val = tensor([1, 1, 1, 1, 1])]; tensor new_cache_internal_tensor_assign_2_begin_mask_0 = const()[name = tensor("new_cache_internal_tensor_assign_2_begin_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_internal_tensor_assign_2_end_mask_0 = const()[name = tensor("new_cache_internal_tensor_assign_2_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor new_cache_internal_tensor_assign_2_squeeze_mask_0 = const()[name = tensor("new_cache_internal_tensor_assign_2_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor shape_23 = const()[name = tensor("shape_23"), val = tensor([2, 1, 512, 16, 64])]; tensor reduce_prod_11 = const()[name = tensor("reduce_prod_11"), val = tensor(1048576)]; tensor range_1d_11_start_0 = const()[name = tensor("range_1d_11_start_0"), val = tensor(0)]; tensor range_1d_11_step_0 = const()[name = tensor("range_1d_11_step_0"), val = tensor(1)]; tensor range_1d_11 = range_1d(end = reduce_prod_11, start = range_1d_11_start_0, step = range_1d_11_step_0)[name = tensor("range_1d_11")]; tensor reshape_55 = reshape(shape = shape_23, x = range_1d_11)[name = tensor("reshape_55")]; tensor slice_by_index_11 = slice_by_index(begin = concat_39, begin_mask = new_cache_internal_tensor_assign_2_begin_mask_0, end = concat_40, end_mask = new_cache_internal_tensor_assign_2_end_mask_0, squeeze_mask = new_cache_internal_tensor_assign_2_squeeze_mask_0, stride = new_cache_internal_tensor_assign_2_stride_0, x = reshape_55)[name = tensor("slice_by_index_11")]; tensor reshape_56_shape_0 = const()[name = tensor("reshape_56_shape_0"), val = tensor([-1])]; tensor reshape_56 = reshape(shape = reshape_56_shape_0, x = slice_by_index_11)[name = tensor("reshape_56")]; tensor reshape_57_shape_0 = const()[name = tensor("reshape_57_shape_0"), val = tensor([-1])]; tensor reshape_57 = reshape(shape = reshape_57_shape_0, x = var_2437)[name = tensor("reshape_57")]; tensor reshape_58_shape_0 = const()[name = tensor("reshape_58_shape_0"), val = tensor([-1])]; tensor reshape_58 = reshape(shape = reshape_58_shape_0, x = reshape_54)[name = tensor("reshape_58")]; tensor scatter_11_mode_0 = const()[name = tensor("scatter_11_mode_0"), val = tensor("update")]; tensor scatter_11_axis_0 = const()[name = tensor("scatter_11_axis_0"), val = tensor(0)]; tensor scatter_11_validate_indices_0 = const()[name = tensor("scatter_11_validate_indices_0"), val = tensor(false)]; tensor scatter_11 = scatter(axis = scatter_11_axis_0, data = reshape_58, indices = reshape_56, mode = scatter_11_mode_0, updates = reshape_57, validate_indices = scatter_11_validate_indices_0)[name = tensor("scatter_11")]; tensor new_cache_internal_tensor_assign_2 = reshape(shape = shape_23, x = scatter_11)[name = tensor("reshape_59")]; tensor keys_31_begin_0 = const()[name = tensor("keys_31_begin_0"), val = tensor([0, 0, 0, 0, 0])]; tensor keys_31_end_0 = const()[name = tensor("keys_31_end_0"), val = tensor([1, 1, 512, 16, 64])]; tensor keys_31_end_mask_0 = const()[name = tensor("keys_31_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor keys_31_squeeze_mask_0 = const()[name = tensor("keys_31_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor keys_31 = slice_by_index(begin = keys_31_begin_0, end = keys_31_end_0, end_mask = keys_31_end_mask_0, squeeze_mask = keys_31_squeeze_mask_0, x = new_cache_internal_tensor_assign_2)[name = tensor("keys_31")]; tensor values_31_begin_0 = const()[name = tensor("values_31_begin_0"), val = tensor([1, 0, 0, 0, 0])]; tensor values_31_end_0 = const()[name = tensor("values_31_end_0"), val = tensor([2, 1, 512, 16, 64])]; tensor values_31_end_mask_0 = const()[name = tensor("values_31_end_mask_0"), val = tensor([false, true, true, true, true])]; tensor values_31_squeeze_mask_0 = const()[name = tensor("values_31_squeeze_mask_0"), val = tensor([true, false, false, false, false])]; tensor values_31 = slice_by_index(begin = values_31_begin_0, end = values_31_end_0, end_mask = values_31_end_mask_0, squeeze_mask = values_31_squeeze_mask_0, x = new_cache_internal_tensor_assign_2)[name = tensor("values_31")]; tensor var_2449 = not_equal(x = keys_31, y = keys_31)[name = tensor("op_2449")]; tensor keys_33 = select(a = var_360, b = keys_31, cond = var_2449)[name = tensor("keys_33")]; tensor var_2457 = not_equal(x = values_31, y = values_31)[name = tensor("op_2457")]; tensor values_33 = select(a = var_360, b = values_31, cond = var_2457)[name = tensor("values_33")]; tensor var_2481 = const()[name = tensor("op_2481"), val = tensor([0, 2, 1, 3])]; tensor var_2494 = const()[name = tensor("op_2494"), val = tensor([1, 1, 1])]; tensor var_2495 = reshape(shape = var_2494, x = position5)[name = tensor("op_2495")]; tensor var_2512 = const()[name = tensor("op_2512"), val = tensor(0x1p+0)]; tensor valid_len = add(x = var_2495, y = var_2512)[name = tensor("valid_len")]; tensor valid_mask = less(x = k_positions_1_promoted, y = valid_len)[name = tensor("valid_mask")]; tensor causal_mask = less_equal(x = k_positions_1_promoted, y = var_2495)[name = tensor("causal_mask")]; tensor attn_mask_21 = logical_and(x = valid_mask, y = causal_mask)[name = tensor("attn_mask_21")]; tensor attn_mask_axes_0 = const()[name = tensor("attn_mask_axes_0"), val = tensor([1])]; tensor attn_mask = expand_dims(axes = attn_mask_axes_0, x = attn_mask_21)[name = tensor("attn_mask")]; tensor var_2524 = const()[name = tensor("op_2524"), val = tensor([0x1.fffe5cp-4])]; tensor var_2530_transpose_x_0 = const()[name = tensor("op_2530_transpose_x_0"), val = tensor(false)]; tensor var_2530_transpose_y_0 = const()[name = tensor("op_2530_transpose_y_0"), val = tensor(false)]; tensor transpose_28_perm_0 = const()[name = tensor("transpose_28_perm_0"), val = tensor([0, 2, -3, -1])]; tensor transpose_29_perm_0 = const()[name = tensor("transpose_29_perm_0"), val = tensor([0, 2, -1, -3])]; tensor transpose_29 = transpose(perm = transpose_29_perm_0, x = keys_33)[name = tensor("transpose_31")]; tensor transpose_28 = transpose(perm = transpose_28_perm_0, x = q_33)[name = tensor("transpose_32")]; tensor var_2530 = matmul(transpose_x = var_2530_transpose_x_0, transpose_y = var_2530_transpose_y_0, x = transpose_28, y = transpose_29)[name = tensor("op_2530")]; tensor attn_weights_31 = mul(x = var_2530, y = var_2524)[name = tensor("attn_weights_31")]; tensor var_2532 = logical_not(x = attn_mask)[name = tensor("op_2532")]; tensor var_2533 = const()[name = tensor("op_2533"), val = tensor(-0x1.ff933cp+127)]; tensor attn_weights_33 = select(a = var_2533, b = attn_weights_31, cond = var_2532)[name = tensor("attn_weights_33")]; tensor var_2535 = const()[name = tensor("op_2535"), val = tensor(-1)]; tensor attn_weights = softmax(axis = var_2535, x = attn_weights_33)[name = tensor("attn_weights")]; tensor attn_output_transpose_x_0 = const()[name = tensor("attn_output_transpose_x_0"), val = tensor(false)]; tensor attn_output_transpose_y_0 = const()[name = tensor("attn_output_transpose_y_0"), val = tensor(false)]; tensor values = transpose(perm = var_2481, x = values_33)[name = tensor("transpose_33")]; tensor attn_output = matmul(transpose_x = attn_output_transpose_x_0, transpose_y = attn_output_transpose_y_0, x = attn_weights, y = values)[name = tensor("attn_output")]; tensor var_2543 = const()[name = tensor("op_2543"), val = tensor([0, 2, 1, 3])]; tensor var_2546 = const()[name = tensor("op_2546"), val = tensor([1, 1, 1024])]; tensor var_2544 = transpose(perm = var_2543, x = attn_output)[name = tensor("transpose_30")]; tensor input_55 = reshape(shape = var_2546, x = var_2544)[name = tensor("input_55")]; tensor attn_out = linear(bias = linear_0_bias_0, weight = attn5_out_proj_weight, x = input_55)[name = tensor("linear_22")]; tensor var_2552 = const()[name = tensor("op_2552"), val = tensor(0x1p+0)]; tensor var_2553 = add(x = position5, y = var_2552)[name = tensor("op_2553")]; tensor input_57 = add(x = input_53, y = attn_out)[name = tensor("input_57")]; tensor var_2557 = const()[name = tensor("op_2557"), val = tensor(0x1.4f8b58p-17)]; tensor input_59_axes_0 = const()[name = tensor("input_59_axes_0"), val = tensor([-1])]; tensor input_59 = layer_norm(axes = input_59_axes_0, beta = norm5_2_bias, epsilon = var_2557, gamma = norm5_2_weight, x = input_57)[name = tensor("input_59")]; tensor var_2565 = linear(bias = linear_3_bias_0, weight = linear5_1_weight, x = input_59)[name = tensor("linear_23")]; tensor input_61_mode_0 = const()[name = tensor("input_61_mode_0"), val = tensor("EXACT")]; tensor input_61 = gelu(mode = input_61_mode_0, x = var_2565)[name = tensor("input_61")]; tensor ffn_out = linear(bias = linear_0_bias_0, weight = linear5_2_weight, x = input_61)[name = tensor("linear_24")]; tensor input_63 = add(x = input_57, y = ffn_out)[name = tensor("input_63")]; tensor var_2574 = const()[name = tensor("op_2574"), val = tensor(0x1.4f8b58p-17)]; tensor input_axes_0 = const()[name = tensor("input_axes_0"), val = tensor([-1])]; tensor input = layer_norm(axes = input_axes_0, beta = out_norm_bias, epsilon = var_2574, gamma = out_norm_weight, x = input_63)[name = tensor("input")]; tensor var_2582 = linear(bias = out_eos_bias, weight = out_eos_weight, x = input)[name = tensor("linear_25")]; } -> (input, var_2582, new_cache_1_internal_tensor_assign_2, var_458, new_cache_3_internal_tensor_assign_2, var_877, new_cache_5_internal_tensor_assign_2, var_1296, new_cache_7_internal_tensor_assign_2, var_1715, new_cache_9_internal_tensor_assign_2, var_2134, new_cache_internal_tensor_assign_2, var_2553); }