program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "4.28.4"}, {"coremlc-version", "1436.100.10"}})] { func main(tensor logmel_data) { tensor var_20 = const()[name = tensor("op_20"), val = tensor(1)]; tensor var_28 = const()[name = tensor("op_28"), val = tensor([1])]; tensor var_30 = const()[name = tensor("op_30"), val = tensor([1])]; tensor var_32_pad_type_0 = const()[name = tensor("op_32_pad_type_0"), val = tensor("custom")]; tensor var_32_pad_0 = const()[name = tensor("op_32_pad_0"), val = tensor([1, 1])]; tensor logmel_data_to_fp16_dtype_0 = const()[name = tensor("logmel_data_to_fp16_dtype_0"), val = tensor("fp16")]; tensor weight_3_to_fp16 = const()[name = tensor("weight_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor bias_3_to_fp16 = const()[name = tensor("bias_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245888)))]; tensor cast_187 = cast(dtype = logmel_data_to_fp16_dtype_0, x = logmel_data); tensor var_32_cast = conv(bias = bias_3_to_fp16, dilations = var_30, groups = var_20, pad = var_32_pad_0, pad_type = var_32_pad_type_0, strides = var_28, weight = weight_3_to_fp16, x = cast_187); tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast = gelu(mode = input_1_mode_0, x = var_32_cast); tensor var_36 = const()[name = tensor("op_36"), val = tensor(1)]; tensor var_45 = const()[name = tensor("op_45"), val = tensor([2])]; tensor var_47 = const()[name = tensor("op_47"), val = tensor([1])]; tensor var_49_pad_type_0 = const()[name = tensor("op_49_pad_type_0"), val = tensor("custom")]; tensor var_49_pad_0 = const()[name = tensor("op_49_pad_0"), val = tensor([1, 1])]; tensor weight_7_to_fp16 = const()[name = tensor("weight_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(246976)))]; tensor bias_7_to_fp16 = const()[name = tensor("bias_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1819904)))]; tensor var_49_cast = conv(bias = bias_7_to_fp16, dilations = var_47, groups = var_36, pad = var_49_pad_0, pad_type = var_49_pad_type_0, strides = var_45, weight = weight_7_to_fp16, x = input_1_cast); tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; tensor x_3_cast = gelu(mode = x_3_mode_0, x = var_49_cast); tensor var_54 = const()[name = tensor("op_54"), val = tensor([0, 2, 1])]; tensor positional_embedding_to_fp16 = const()[name = tensor("positional_embedding_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1820992)))]; tensor transpose_48 = transpose(perm = var_54, x = x_3_cast); tensor var_57_cast = add(x = transpose_48, y = positional_embedding_to_fp16); tensor var_70 = const()[name = tensor("op_70"), val = tensor(-1)]; tensor var_87_axes_0 = const()[name = tensor("op_87_axes_0"), val = tensor([-1])]; tensor blocks_0_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_0_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3357056)))]; tensor blocks_0_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_0_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3358144)))]; tensor var_76_to_fp16 = const()[name = tensor("op_76_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_87_cast = layer_norm(axes = var_87_axes_0, beta = blocks_0_attn_ln_bias_to_fp16, epsilon = var_76_to_fp16, gamma = blocks_0_attn_ln_weight_to_fp16, x = var_57_cast); tensor var_98_to_fp16 = const()[name = tensor("op_98_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3359232)))]; tensor var_99_to_fp16 = const()[name = tensor("op_99_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3883584)))]; tensor q_1_cast = linear(bias = var_99_to_fp16, weight = var_98_to_fp16, x = var_87_cast); tensor var_102_to_fp16 = const()[name = tensor("op_102_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3884672)))]; tensor k_1_bias_0_to_fp16 = const()[name = tensor("k_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4409024)))]; tensor k_1_cast = linear(bias = k_1_bias_0_to_fp16, weight = var_102_to_fp16, x = var_87_cast); tensor var_106_to_fp16 = const()[name = tensor("op_106_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4410112)))]; tensor var_107_to_fp16 = const()[name = tensor("op_107_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4934464)))]; tensor v_1_cast = linear(bias = var_107_to_fp16, weight = var_106_to_fp16, x = var_87_cast); tensor var_115 = const()[name = tensor("op_115"), val = tensor([1, 1500, 8, -1])]; tensor var_116_cast = reshape(shape = var_115, x = q_1_cast); tensor const_42_to_fp16 = const()[name = tensor("const_42_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_3_cast = mul(x = var_116_cast, y = const_42_to_fp16); tensor var_122 = const()[name = tensor("op_122"), val = tensor([1, 1500, 8, -1])]; tensor var_123_cast = reshape(shape = var_122, x = k_1_cast); tensor const_43_to_fp16 = const()[name = tensor("const_43_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_3_cast = mul(x = var_123_cast, y = const_43_to_fp16); tensor var_129 = const()[name = tensor("op_129"), val = tensor([1, 1500, 8, -1])]; tensor var_130_cast = reshape(shape = var_129, x = v_1_cast); tensor var_131 = const()[name = tensor("op_131"), val = tensor([0, 2, 1, 3])]; tensor qk_1_transpose_x_0 = const()[name = tensor("qk_1_transpose_x_0"), val = tensor(false)]; tensor qk_1_transpose_y_0 = const()[name = tensor("qk_1_transpose_y_0"), val = tensor(false)]; tensor transpose_12_perm_0 = const()[name = tensor("transpose_12_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_13_perm_0 = const()[name = tensor("transpose_13_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_45 = transpose(perm = transpose_13_perm_0, x = k_3_cast); tensor transpose_46 = transpose(perm = transpose_12_perm_0, x = q_3_cast); tensor qk_1_cast = matmul(transpose_x = qk_1_transpose_x_0, transpose_y = qk_1_transpose_y_0, x = transpose_46, y = transpose_45); tensor var_135_cast = softmax(axis = var_70, x = qk_1_cast); tensor var_137_transpose_x_0 = const()[name = tensor("op_137_transpose_x_0"), val = tensor(false)]; tensor var_137_transpose_y_0 = const()[name = tensor("op_137_transpose_y_0"), val = tensor(false)]; tensor transpose_47 = transpose(perm = var_131, x = var_130_cast); tensor var_137_cast = matmul(transpose_x = var_137_transpose_x_0, transpose_y = var_137_transpose_y_0, x = var_135_cast, y = transpose_47); tensor var_138 = const()[name = tensor("op_138"), val = tensor([0, 2, 1, 3])]; tensor concat_0 = const()[name = tensor("concat_0"), val = tensor([1, 1500, 512])]; tensor transpose_44 = transpose(perm = var_138, x = var_137_cast); tensor x_11_cast = reshape(shape = concat_0, x = transpose_44); tensor var_143_to_fp16 = const()[name = tensor("op_143_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4935552)))]; tensor var_144_to_fp16 = const()[name = tensor("op_144_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5459904)))]; tensor var_145_cast = linear(bias = var_144_to_fp16, weight = var_143_to_fp16, x = x_11_cast); tensor x_13_cast = add(x = var_57_cast, y = var_145_cast); tensor var_151_axes_0 = const()[name = tensor("op_151_axes_0"), val = tensor([-1])]; tensor blocks_0_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5460992)))]; tensor blocks_0_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5462080)))]; tensor var_151_cast = layer_norm(axes = var_151_axes_0, beta = blocks_0_mlp_ln_bias_to_fp16, epsilon = var_76_to_fp16, gamma = blocks_0_mlp_ln_weight_to_fp16, x = x_13_cast); tensor var_160_to_fp16 = const()[name = tensor("op_160_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5463168)))]; tensor var_161_to_fp16 = const()[name = tensor("op_161_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7560384)))]; tensor input_9_cast = linear(bias = var_161_to_fp16, weight = var_160_to_fp16, x = var_151_cast); tensor x_17_mode_0 = const()[name = tensor("x_17_mode_0"), val = tensor("EXACT")]; tensor x_17_cast = gelu(mode = x_17_mode_0, x = input_9_cast); tensor var_166_to_fp16 = const()[name = tensor("op_166_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(7564544)))]; tensor var_167_to_fp16 = const()[name = tensor("op_167_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9661760)))]; tensor var_168_cast = linear(bias = var_167_to_fp16, weight = var_166_to_fp16, x = x_17_cast); tensor x_19_cast = add(x = x_13_cast, y = var_168_cast); tensor var_177 = const()[name = tensor("op_177"), val = tensor(-1)]; tensor var_194_axes_0 = const()[name = tensor("op_194_axes_0"), val = tensor([-1])]; tensor blocks_1_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_1_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9662848)))]; tensor blocks_1_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_1_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9663936)))]; tensor var_183_to_fp16 = const()[name = tensor("op_183_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_194_cast = layer_norm(axes = var_194_axes_0, beta = blocks_1_attn_ln_bias_to_fp16, epsilon = var_183_to_fp16, gamma = blocks_1_attn_ln_weight_to_fp16, x = x_19_cast); tensor var_205_to_fp16 = const()[name = tensor("op_205_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9665024)))]; tensor var_206_to_fp16 = const()[name = tensor("op_206_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10189376)))]; tensor q_5_cast = linear(bias = var_206_to_fp16, weight = var_205_to_fp16, x = var_194_cast); tensor var_209_to_fp16 = const()[name = tensor("op_209_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10190464)))]; tensor k_5_bias_0_to_fp16 = const()[name = tensor("k_5_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10714816)))]; tensor k_5_cast = linear(bias = k_5_bias_0_to_fp16, weight = var_209_to_fp16, x = var_194_cast); tensor var_213_to_fp16 = const()[name = tensor("op_213_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10715904)))]; tensor var_214_to_fp16 = const()[name = tensor("op_214_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11240256)))]; tensor v_5_cast = linear(bias = var_214_to_fp16, weight = var_213_to_fp16, x = var_194_cast); tensor var_222 = const()[name = tensor("op_222"), val = tensor([1, 1500, 8, -1])]; tensor var_223_cast = reshape(shape = var_222, x = q_5_cast); tensor const_44_to_fp16 = const()[name = tensor("const_44_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_7_cast = mul(x = var_223_cast, y = const_44_to_fp16); tensor var_229 = const()[name = tensor("op_229"), val = tensor([1, 1500, 8, -1])]; tensor var_230_cast = reshape(shape = var_229, x = k_5_cast); tensor const_45_to_fp16 = const()[name = tensor("const_45_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_7_cast = mul(x = var_230_cast, y = const_45_to_fp16); tensor var_236 = const()[name = tensor("op_236"), val = tensor([1, 1500, 8, -1])]; tensor var_237_cast = reshape(shape = var_236, x = v_5_cast); tensor var_238 = const()[name = tensor("op_238"), val = tensor([0, 2, 1, 3])]; tensor qk_3_transpose_x_0 = const()[name = tensor("qk_3_transpose_x_0"), val = tensor(false)]; tensor qk_3_transpose_y_0 = const()[name = tensor("qk_3_transpose_y_0"), val = tensor(false)]; tensor transpose_14_perm_0 = const()[name = tensor("transpose_14_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_15_perm_0 = const()[name = tensor("transpose_15_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_41 = transpose(perm = transpose_15_perm_0, x = k_7_cast); tensor transpose_42 = transpose(perm = transpose_14_perm_0, x = q_7_cast); tensor qk_3_cast = matmul(transpose_x = qk_3_transpose_x_0, transpose_y = qk_3_transpose_y_0, x = transpose_42, y = transpose_41); tensor var_242_cast = softmax(axis = var_177, x = qk_3_cast); tensor var_244_transpose_x_0 = const()[name = tensor("op_244_transpose_x_0"), val = tensor(false)]; tensor var_244_transpose_y_0 = const()[name = tensor("op_244_transpose_y_0"), val = tensor(false)]; tensor transpose_43 = transpose(perm = var_238, x = var_237_cast); tensor var_244_cast = matmul(transpose_x = var_244_transpose_x_0, transpose_y = var_244_transpose_y_0, x = var_242_cast, y = transpose_43); tensor var_245 = const()[name = tensor("op_245"), val = tensor([0, 2, 1, 3])]; tensor concat_1 = const()[name = tensor("concat_1"), val = tensor([1, 1500, 512])]; tensor transpose_40 = transpose(perm = var_245, x = var_244_cast); tensor x_23_cast = reshape(shape = concat_1, x = transpose_40); tensor var_250_to_fp16 = const()[name = tensor("op_250_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11241344)))]; tensor var_251_to_fp16 = const()[name = tensor("op_251_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11765696)))]; tensor var_252_cast = linear(bias = var_251_to_fp16, weight = var_250_to_fp16, x = x_23_cast); tensor x_25_cast = add(x = x_19_cast, y = var_252_cast); tensor var_258_axes_0 = const()[name = tensor("op_258_axes_0"), val = tensor([-1])]; tensor blocks_1_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11766784)))]; tensor blocks_1_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11767872)))]; tensor var_258_cast = layer_norm(axes = var_258_axes_0, beta = blocks_1_mlp_ln_bias_to_fp16, epsilon = var_183_to_fp16, gamma = blocks_1_mlp_ln_weight_to_fp16, x = x_25_cast); tensor var_267_to_fp16 = const()[name = tensor("op_267_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11768960)))]; tensor var_268_to_fp16 = const()[name = tensor("op_268_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13866176)))]; tensor input_17_cast = linear(bias = var_268_to_fp16, weight = var_267_to_fp16, x = var_258_cast); tensor x_29_mode_0 = const()[name = tensor("x_29_mode_0"), val = tensor("EXACT")]; tensor x_29_cast = gelu(mode = x_29_mode_0, x = input_17_cast); tensor var_273_to_fp16 = const()[name = tensor("op_273_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13870336)))]; tensor var_274_to_fp16 = const()[name = tensor("op_274_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15967552)))]; tensor var_275_cast = linear(bias = var_274_to_fp16, weight = var_273_to_fp16, x = x_29_cast); tensor x_31_cast = add(x = x_25_cast, y = var_275_cast); tensor var_284 = const()[name = tensor("op_284"), val = tensor(-1)]; tensor var_301_axes_0 = const()[name = tensor("op_301_axes_0"), val = tensor([-1])]; tensor blocks_2_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_2_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15968640)))]; tensor blocks_2_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_2_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15969728)))]; tensor var_290_to_fp16 = const()[name = tensor("op_290_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_301_cast = layer_norm(axes = var_301_axes_0, beta = blocks_2_attn_ln_bias_to_fp16, epsilon = var_290_to_fp16, gamma = blocks_2_attn_ln_weight_to_fp16, x = x_31_cast); tensor var_312_to_fp16 = const()[name = tensor("op_312_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15970816)))]; tensor var_313_to_fp16 = const()[name = tensor("op_313_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16495168)))]; tensor q_9_cast = linear(bias = var_313_to_fp16, weight = var_312_to_fp16, x = var_301_cast); tensor var_316_to_fp16 = const()[name = tensor("op_316_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16496256)))]; tensor k_9_bias_0_to_fp16 = const()[name = tensor("k_9_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17020608)))]; tensor k_9_cast = linear(bias = k_9_bias_0_to_fp16, weight = var_316_to_fp16, x = var_301_cast); tensor var_320_to_fp16 = const()[name = tensor("op_320_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17021696)))]; tensor var_321_to_fp16 = const()[name = tensor("op_321_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17546048)))]; tensor v_9_cast = linear(bias = var_321_to_fp16, weight = var_320_to_fp16, x = var_301_cast); tensor var_329 = const()[name = tensor("op_329"), val = tensor([1, 1500, 8, -1])]; tensor var_330_cast = reshape(shape = var_329, x = q_9_cast); tensor const_46_to_fp16 = const()[name = tensor("const_46_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_11_cast = mul(x = var_330_cast, y = const_46_to_fp16); tensor var_336 = const()[name = tensor("op_336"), val = tensor([1, 1500, 8, -1])]; tensor var_337_cast = reshape(shape = var_336, x = k_9_cast); tensor const_47_to_fp16 = const()[name = tensor("const_47_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_11_cast = mul(x = var_337_cast, y = const_47_to_fp16); tensor var_343 = const()[name = tensor("op_343"), val = tensor([1, 1500, 8, -1])]; tensor var_344_cast = reshape(shape = var_343, x = v_9_cast); tensor var_345 = const()[name = tensor("op_345"), val = tensor([0, 2, 1, 3])]; tensor qk_5_transpose_x_0 = const()[name = tensor("qk_5_transpose_x_0"), val = tensor(false)]; tensor qk_5_transpose_y_0 = const()[name = tensor("qk_5_transpose_y_0"), val = tensor(false)]; tensor transpose_16_perm_0 = const()[name = tensor("transpose_16_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_17_perm_0 = const()[name = tensor("transpose_17_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_37 = transpose(perm = transpose_17_perm_0, x = k_11_cast); tensor transpose_38 = transpose(perm = transpose_16_perm_0, x = q_11_cast); tensor qk_5_cast = matmul(transpose_x = qk_5_transpose_x_0, transpose_y = qk_5_transpose_y_0, x = transpose_38, y = transpose_37); tensor var_349_cast = softmax(axis = var_284, x = qk_5_cast); tensor var_351_transpose_x_0 = const()[name = tensor("op_351_transpose_x_0"), val = tensor(false)]; tensor var_351_transpose_y_0 = const()[name = tensor("op_351_transpose_y_0"), val = tensor(false)]; tensor transpose_39 = transpose(perm = var_345, x = var_344_cast); tensor var_351_cast = matmul(transpose_x = var_351_transpose_x_0, transpose_y = var_351_transpose_y_0, x = var_349_cast, y = transpose_39); tensor var_352 = const()[name = tensor("op_352"), val = tensor([0, 2, 1, 3])]; tensor concat_2 = const()[name = tensor("concat_2"), val = tensor([1, 1500, 512])]; tensor transpose_36 = transpose(perm = var_352, x = var_351_cast); tensor x_35_cast = reshape(shape = concat_2, x = transpose_36); tensor var_357_to_fp16 = const()[name = tensor("op_357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(17547136)))]; tensor var_358_to_fp16 = const()[name = tensor("op_358_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18071488)))]; tensor var_359_cast = linear(bias = var_358_to_fp16, weight = var_357_to_fp16, x = x_35_cast); tensor x_37_cast = add(x = x_31_cast, y = var_359_cast); tensor var_365_axes_0 = const()[name = tensor("op_365_axes_0"), val = tensor([-1])]; tensor blocks_2_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18072576)))]; tensor blocks_2_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18073664)))]; tensor var_365_cast = layer_norm(axes = var_365_axes_0, beta = blocks_2_mlp_ln_bias_to_fp16, epsilon = var_290_to_fp16, gamma = blocks_2_mlp_ln_weight_to_fp16, x = x_37_cast); tensor var_374_to_fp16 = const()[name = tensor("op_374_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18074752)))]; tensor var_375_to_fp16 = const()[name = tensor("op_375_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20171968)))]; tensor input_25_cast = linear(bias = var_375_to_fp16, weight = var_374_to_fp16, x = var_365_cast); tensor x_41_mode_0 = const()[name = tensor("x_41_mode_0"), val = tensor("EXACT")]; tensor x_41_cast = gelu(mode = x_41_mode_0, x = input_25_cast); tensor var_380_to_fp16 = const()[name = tensor("op_380_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(20176128)))]; tensor var_381_to_fp16 = const()[name = tensor("op_381_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22273344)))]; tensor var_382_cast = linear(bias = var_381_to_fp16, weight = var_380_to_fp16, x = x_41_cast); tensor x_43_cast = add(x = x_37_cast, y = var_382_cast); tensor var_391 = const()[name = tensor("op_391"), val = tensor(-1)]; tensor var_408_axes_0 = const()[name = tensor("op_408_axes_0"), val = tensor([-1])]; tensor blocks_3_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_3_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22274432)))]; tensor blocks_3_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_3_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22275520)))]; tensor var_397_to_fp16 = const()[name = tensor("op_397_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_408_cast = layer_norm(axes = var_408_axes_0, beta = blocks_3_attn_ln_bias_to_fp16, epsilon = var_397_to_fp16, gamma = blocks_3_attn_ln_weight_to_fp16, x = x_43_cast); tensor var_419_to_fp16 = const()[name = tensor("op_419_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22276608)))]; tensor var_420_to_fp16 = const()[name = tensor("op_420_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22800960)))]; tensor q_13_cast = linear(bias = var_420_to_fp16, weight = var_419_to_fp16, x = var_408_cast); tensor var_423_to_fp16 = const()[name = tensor("op_423_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(22802048)))]; tensor k_13_bias_0_to_fp16 = const()[name = tensor("k_13_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23326400)))]; tensor k_13_cast = linear(bias = k_13_bias_0_to_fp16, weight = var_423_to_fp16, x = var_408_cast); tensor var_427_to_fp16 = const()[name = tensor("op_427_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23327488)))]; tensor var_428_to_fp16 = const()[name = tensor("op_428_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23851840)))]; tensor v_13_cast = linear(bias = var_428_to_fp16, weight = var_427_to_fp16, x = var_408_cast); tensor var_436 = const()[name = tensor("op_436"), val = tensor([1, 1500, 8, -1])]; tensor var_437_cast = reshape(shape = var_436, x = q_13_cast); tensor const_48_to_fp16 = const()[name = tensor("const_48_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_15_cast = mul(x = var_437_cast, y = const_48_to_fp16); tensor var_443 = const()[name = tensor("op_443"), val = tensor([1, 1500, 8, -1])]; tensor var_444_cast = reshape(shape = var_443, x = k_13_cast); tensor const_49_to_fp16 = const()[name = tensor("const_49_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_15_cast = mul(x = var_444_cast, y = const_49_to_fp16); tensor var_450 = const()[name = tensor("op_450"), val = tensor([1, 1500, 8, -1])]; tensor var_451_cast = reshape(shape = var_450, x = v_13_cast); tensor var_452 = const()[name = tensor("op_452"), val = tensor([0, 2, 1, 3])]; tensor qk_7_transpose_x_0 = const()[name = tensor("qk_7_transpose_x_0"), val = tensor(false)]; tensor qk_7_transpose_y_0 = const()[name = tensor("qk_7_transpose_y_0"), val = tensor(false)]; tensor transpose_18_perm_0 = const()[name = tensor("transpose_18_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_19_perm_0 = const()[name = tensor("transpose_19_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_33 = transpose(perm = transpose_19_perm_0, x = k_15_cast); tensor transpose_34 = transpose(perm = transpose_18_perm_0, x = q_15_cast); tensor qk_7_cast = matmul(transpose_x = qk_7_transpose_x_0, transpose_y = qk_7_transpose_y_0, x = transpose_34, y = transpose_33); tensor var_456_cast = softmax(axis = var_391, x = qk_7_cast); tensor var_458_transpose_x_0 = const()[name = tensor("op_458_transpose_x_0"), val = tensor(false)]; tensor var_458_transpose_y_0 = const()[name = tensor("op_458_transpose_y_0"), val = tensor(false)]; tensor transpose_35 = transpose(perm = var_452, x = var_451_cast); tensor var_458_cast = matmul(transpose_x = var_458_transpose_x_0, transpose_y = var_458_transpose_y_0, x = var_456_cast, y = transpose_35); tensor var_459 = const()[name = tensor("op_459"), val = tensor([0, 2, 1, 3])]; tensor concat_3 = const()[name = tensor("concat_3"), val = tensor([1, 1500, 512])]; tensor transpose_32 = transpose(perm = var_459, x = var_458_cast); tensor x_47_cast = reshape(shape = concat_3, x = transpose_32); tensor var_464_to_fp16 = const()[name = tensor("op_464_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(23852928)))]; tensor var_465_to_fp16 = const()[name = tensor("op_465_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24377280)))]; tensor var_466_cast = linear(bias = var_465_to_fp16, weight = var_464_to_fp16, x = x_47_cast); tensor x_49_cast = add(x = x_43_cast, y = var_466_cast); tensor var_472_axes_0 = const()[name = tensor("op_472_axes_0"), val = tensor([-1])]; tensor blocks_3_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24378368)))]; tensor blocks_3_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24379456)))]; tensor var_472_cast = layer_norm(axes = var_472_axes_0, beta = blocks_3_mlp_ln_bias_to_fp16, epsilon = var_397_to_fp16, gamma = blocks_3_mlp_ln_weight_to_fp16, x = x_49_cast); tensor var_481_to_fp16 = const()[name = tensor("op_481_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(24380544)))]; tensor var_482_to_fp16 = const()[name = tensor("op_482_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26477760)))]; tensor input_33_cast = linear(bias = var_482_to_fp16, weight = var_481_to_fp16, x = var_472_cast); tensor x_53_mode_0 = const()[name = tensor("x_53_mode_0"), val = tensor("EXACT")]; tensor x_53_cast = gelu(mode = x_53_mode_0, x = input_33_cast); tensor var_487_to_fp16 = const()[name = tensor("op_487_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26481920)))]; tensor var_488_to_fp16 = const()[name = tensor("op_488_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28579136)))]; tensor var_489_cast = linear(bias = var_488_to_fp16, weight = var_487_to_fp16, x = x_53_cast); tensor x_55_cast = add(x = x_49_cast, y = var_489_cast); tensor var_498 = const()[name = tensor("op_498"), val = tensor(-1)]; tensor var_515_axes_0 = const()[name = tensor("op_515_axes_0"), val = tensor([-1])]; tensor blocks_4_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_4_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28580224)))]; tensor blocks_4_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_4_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28581312)))]; tensor var_504_to_fp16 = const()[name = tensor("op_504_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_515_cast = layer_norm(axes = var_515_axes_0, beta = blocks_4_attn_ln_bias_to_fp16, epsilon = var_504_to_fp16, gamma = blocks_4_attn_ln_weight_to_fp16, x = x_55_cast); tensor var_526_to_fp16 = const()[name = tensor("op_526_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(28582400)))]; tensor var_527_to_fp16 = const()[name = tensor("op_527_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29106752)))]; tensor q_17_cast = linear(bias = var_527_to_fp16, weight = var_526_to_fp16, x = var_515_cast); tensor var_530_to_fp16 = const()[name = tensor("op_530_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29107840)))]; tensor k_17_bias_0_to_fp16 = const()[name = tensor("k_17_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29632192)))]; tensor k_17_cast = linear(bias = k_17_bias_0_to_fp16, weight = var_530_to_fp16, x = var_515_cast); tensor var_534_to_fp16 = const()[name = tensor("op_534_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(29633280)))]; tensor var_535_to_fp16 = const()[name = tensor("op_535_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30157632)))]; tensor v_17_cast = linear(bias = var_535_to_fp16, weight = var_534_to_fp16, x = var_515_cast); tensor var_543 = const()[name = tensor("op_543"), val = tensor([1, 1500, 8, -1])]; tensor var_544_cast = reshape(shape = var_543, x = q_17_cast); tensor const_50_to_fp16 = const()[name = tensor("const_50_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_19_cast = mul(x = var_544_cast, y = const_50_to_fp16); tensor var_550 = const()[name = tensor("op_550"), val = tensor([1, 1500, 8, -1])]; tensor var_551_cast = reshape(shape = var_550, x = k_17_cast); tensor const_51_to_fp16 = const()[name = tensor("const_51_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_19_cast = mul(x = var_551_cast, y = const_51_to_fp16); tensor var_557 = const()[name = tensor("op_557"), val = tensor([1, 1500, 8, -1])]; tensor var_558_cast = reshape(shape = var_557, x = v_17_cast); tensor var_559 = const()[name = tensor("op_559"), val = tensor([0, 2, 1, 3])]; tensor qk_9_transpose_x_0 = const()[name = tensor("qk_9_transpose_x_0"), val = tensor(false)]; tensor qk_9_transpose_y_0 = const()[name = tensor("qk_9_transpose_y_0"), val = tensor(false)]; tensor transpose_20_perm_0 = const()[name = tensor("transpose_20_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_21_perm_0 = const()[name = tensor("transpose_21_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_29 = transpose(perm = transpose_21_perm_0, x = k_19_cast); tensor transpose_30 = transpose(perm = transpose_20_perm_0, x = q_19_cast); tensor qk_9_cast = matmul(transpose_x = qk_9_transpose_x_0, transpose_y = qk_9_transpose_y_0, x = transpose_30, y = transpose_29); tensor var_563_cast = softmax(axis = var_498, x = qk_9_cast); tensor var_565_transpose_x_0 = const()[name = tensor("op_565_transpose_x_0"), val = tensor(false)]; tensor var_565_transpose_y_0 = const()[name = tensor("op_565_transpose_y_0"), val = tensor(false)]; tensor transpose_31 = transpose(perm = var_559, x = var_558_cast); tensor var_565_cast = matmul(transpose_x = var_565_transpose_x_0, transpose_y = var_565_transpose_y_0, x = var_563_cast, y = transpose_31); tensor var_566 = const()[name = tensor("op_566"), val = tensor([0, 2, 1, 3])]; tensor concat_4 = const()[name = tensor("concat_4"), val = tensor([1, 1500, 512])]; tensor transpose_28 = transpose(perm = var_566, x = var_565_cast); tensor x_59_cast = reshape(shape = concat_4, x = transpose_28); tensor var_571_to_fp16 = const()[name = tensor("op_571_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30158720)))]; tensor var_572_to_fp16 = const()[name = tensor("op_572_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30683072)))]; tensor var_573_cast = linear(bias = var_572_to_fp16, weight = var_571_to_fp16, x = x_59_cast); tensor x_61_cast = add(x = x_55_cast, y = var_573_cast); tensor var_579_axes_0 = const()[name = tensor("op_579_axes_0"), val = tensor([-1])]; tensor blocks_4_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30684160)))]; tensor blocks_4_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30685248)))]; tensor var_579_cast = layer_norm(axes = var_579_axes_0, beta = blocks_4_mlp_ln_bias_to_fp16, epsilon = var_504_to_fp16, gamma = blocks_4_mlp_ln_weight_to_fp16, x = x_61_cast); tensor var_588_to_fp16 = const()[name = tensor("op_588_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(30686336)))]; tensor var_589_to_fp16 = const()[name = tensor("op_589_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32783552)))]; tensor input_41_cast = linear(bias = var_589_to_fp16, weight = var_588_to_fp16, x = var_579_cast); tensor x_65_mode_0 = const()[name = tensor("x_65_mode_0"), val = tensor("EXACT")]; tensor x_65_cast = gelu(mode = x_65_mode_0, x = input_41_cast); tensor var_594_to_fp16 = const()[name = tensor("op_594_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(32787712)))]; tensor var_595_to_fp16 = const()[name = tensor("op_595_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34884928)))]; tensor var_596_cast = linear(bias = var_595_to_fp16, weight = var_594_to_fp16, x = x_65_cast); tensor x_67_cast = add(x = x_61_cast, y = var_596_cast); tensor var_605 = const()[name = tensor("op_605"), val = tensor(-1)]; tensor var_622_axes_0 = const()[name = tensor("op_622_axes_0"), val = tensor([-1])]; tensor blocks_5_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_5_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34886016)))]; tensor blocks_5_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_5_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34887104)))]; tensor var_611_to_fp16 = const()[name = tensor("op_611_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_622_cast = layer_norm(axes = var_622_axes_0, beta = blocks_5_attn_ln_bias_to_fp16, epsilon = var_611_to_fp16, gamma = blocks_5_attn_ln_weight_to_fp16, x = x_67_cast); tensor var_633_to_fp16 = const()[name = tensor("op_633_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(34888192)))]; tensor var_634_to_fp16 = const()[name = tensor("op_634_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35412544)))]; tensor q_21_cast = linear(bias = var_634_to_fp16, weight = var_633_to_fp16, x = var_622_cast); tensor var_637_to_fp16 = const()[name = tensor("op_637_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35413632)))]; tensor k_21_bias_0_to_fp16 = const()[name = tensor("k_21_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35937984)))]; tensor k_21_cast = linear(bias = k_21_bias_0_to_fp16, weight = var_637_to_fp16, x = var_622_cast); tensor var_641_to_fp16 = const()[name = tensor("op_641_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35939072)))]; tensor var_642_to_fp16 = const()[name = tensor("op_642_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36463424)))]; tensor v_21_cast = linear(bias = var_642_to_fp16, weight = var_641_to_fp16, x = var_622_cast); tensor var_650 = const()[name = tensor("op_650"), val = tensor([1, 1500, 8, -1])]; tensor var_651_cast = reshape(shape = var_650, x = q_21_cast); tensor const_52_to_fp16 = const()[name = tensor("const_52_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_cast = mul(x = var_651_cast, y = const_52_to_fp16); tensor var_657 = const()[name = tensor("op_657"), val = tensor([1, 1500, 8, -1])]; tensor var_658_cast = reshape(shape = var_657, x = k_21_cast); tensor const_53_to_fp16 = const()[name = tensor("const_53_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_cast = mul(x = var_658_cast, y = const_53_to_fp16); tensor var_664 = const()[name = tensor("op_664"), val = tensor([1, 1500, 8, -1])]; tensor var_665_cast = reshape(shape = var_664, x = v_21_cast); tensor var_666 = const()[name = tensor("op_666"), val = tensor([0, 2, 1, 3])]; tensor qk_transpose_x_0 = const()[name = tensor("qk_transpose_x_0"), val = tensor(false)]; tensor qk_transpose_y_0 = const()[name = tensor("qk_transpose_y_0"), val = tensor(false)]; tensor transpose_22_perm_0 = const()[name = tensor("transpose_22_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_23_perm_0 = const()[name = tensor("transpose_23_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_25 = transpose(perm = transpose_23_perm_0, x = k_cast); tensor transpose_26 = transpose(perm = transpose_22_perm_0, x = q_cast); tensor qk_cast = matmul(transpose_x = qk_transpose_x_0, transpose_y = qk_transpose_y_0, x = transpose_26, y = transpose_25); tensor var_670_cast = softmax(axis = var_605, x = qk_cast); tensor var_672_transpose_x_0 = const()[name = tensor("op_672_transpose_x_0"), val = tensor(false)]; tensor var_672_transpose_y_0 = const()[name = tensor("op_672_transpose_y_0"), val = tensor(false)]; tensor transpose_27 = transpose(perm = var_666, x = var_665_cast); tensor var_672_cast = matmul(transpose_x = var_672_transpose_x_0, transpose_y = var_672_transpose_y_0, x = var_670_cast, y = transpose_27); tensor var_673 = const()[name = tensor("op_673"), val = tensor([0, 2, 1, 3])]; tensor concat_5 = const()[name = tensor("concat_5"), val = tensor([1, 1500, 512])]; tensor transpose_24 = transpose(perm = var_673, x = var_672_cast); tensor x_71_cast = reshape(shape = concat_5, x = transpose_24); tensor var_678_to_fp16 = const()[name = tensor("op_678_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36464512)))]; tensor var_679_to_fp16 = const()[name = tensor("op_679_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36988864)))]; tensor var_680_cast = linear(bias = var_679_to_fp16, weight = var_678_to_fp16, x = x_71_cast); tensor x_73_cast = add(x = x_67_cast, y = var_680_cast); tensor var_686_axes_0 = const()[name = tensor("op_686_axes_0"), val = tensor([-1])]; tensor blocks_5_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36989952)))]; tensor blocks_5_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36991040)))]; tensor var_686_cast = layer_norm(axes = var_686_axes_0, beta = blocks_5_mlp_ln_bias_to_fp16, epsilon = var_611_to_fp16, gamma = blocks_5_mlp_ln_weight_to_fp16, x = x_73_cast); tensor var_695_to_fp16 = const()[name = tensor("op_695_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(36992128)))]; tensor var_696_to_fp16 = const()[name = tensor("op_696_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39089344)))]; tensor input_49_cast = linear(bias = var_696_to_fp16, weight = var_695_to_fp16, x = var_686_cast); tensor x_77_mode_0 = const()[name = tensor("x_77_mode_0"), val = tensor("EXACT")]; tensor x_77_cast = gelu(mode = x_77_mode_0, x = input_49_cast); tensor var_701_to_fp16 = const()[name = tensor("op_701_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39093504)))]; tensor var_702_to_fp16 = const()[name = tensor("op_702_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41190720)))]; tensor var_703_cast = linear(bias = var_702_to_fp16, weight = var_701_to_fp16, x = x_77_cast); tensor x_cast = add(x = x_73_cast, y = var_703_cast); tensor var_716_axes_0 = const()[name = tensor("op_716_axes_0"), val = tensor([-1])]; tensor ln_post_weight_to_fp16 = const()[name = tensor("ln_post_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41191808)))]; tensor ln_post_bias_to_fp16 = const()[name = tensor("ln_post_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41192896)))]; tensor var_707_to_fp16 = const()[name = tensor("op_707_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_716_cast = layer_norm(axes = var_716_axes_0, beta = ln_post_bias_to_fp16, epsilon = var_707_to_fp16, gamma = ln_post_weight_to_fp16, x = x_cast); tensor var_716_cast_to_fp32_dtype_0 = const()[name = tensor("op_716_cast_to_fp32_dtype_0"), val = tensor("fp32")]; tensor output = cast(dtype = var_716_cast_to_fp32_dtype_0, x = var_716_cast); } -> (output); }