program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "4.28.4"}, {"coremlc-version", "1436.100.10"}})] { func main(tensor logmel_data) { tensor var_16 = const()[name = tensor("op_16"), val = tensor(1)]; tensor var_24 = const()[name = tensor("op_24"), val = tensor([1])]; tensor var_26 = const()[name = tensor("op_26"), val = tensor([1])]; tensor var_28_pad_type_0 = const()[name = tensor("op_28_pad_type_0"), val = tensor("custom")]; tensor var_28_pad_0 = const()[name = tensor("op_28_pad_0"), val = tensor([1, 1])]; tensor logmel_data_to_fp16_dtype_0 = const()[name = tensor("logmel_data_to_fp16_dtype_0"), val = tensor("fp16")]; tensor weight_3_to_fp16 = const()[name = tensor("weight_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor bias_3_to_fp16 = const()[name = tensor("bias_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(184448)))]; tensor cast_127 = cast(dtype = logmel_data_to_fp16_dtype_0, x = logmel_data); tensor var_28_cast = conv(bias = bias_3_to_fp16, dilations = var_26, groups = var_16, pad = var_28_pad_0, pad_type = var_28_pad_type_0, strides = var_24, weight = weight_3_to_fp16, x = cast_127); tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast = gelu(mode = input_1_mode_0, x = var_28_cast); tensor var_32 = const()[name = tensor("op_32"), val = tensor(1)]; tensor var_41 = const()[name = tensor("op_41"), val = tensor([2])]; tensor var_43 = const()[name = tensor("op_43"), val = tensor([1])]; tensor var_45_pad_type_0 = const()[name = tensor("op_45_pad_type_0"), val = tensor("custom")]; tensor var_45_pad_0 = const()[name = tensor("op_45_pad_0"), val = tensor([1, 1])]; tensor weight_7_to_fp16 = const()[name = tensor("weight_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(185280)))]; tensor bias_7_to_fp16 = const()[name = tensor("bias_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1070080)))]; tensor var_45_cast = conv(bias = bias_7_to_fp16, dilations = var_43, groups = var_32, pad = var_45_pad_0, pad_type = var_45_pad_type_0, strides = var_41, weight = weight_7_to_fp16, x = input_1_cast); tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; tensor x_3_cast = gelu(mode = x_3_mode_0, x = var_45_cast); tensor var_50 = const()[name = tensor("op_50"), val = tensor([0, 2, 1])]; tensor positional_embedding_to_fp16 = const()[name = tensor("positional_embedding_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(1070912)))]; tensor transpose_32 = transpose(perm = var_50, x = x_3_cast); tensor var_53_cast = add(x = transpose_32, y = positional_embedding_to_fp16); tensor var_65 = const()[name = tensor("op_65"), val = tensor(-1)]; tensor var_82_axes_0 = const()[name = tensor("op_82_axes_0"), val = tensor([-1])]; tensor blocks_0_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_0_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2222976)))]; tensor blocks_0_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_0_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2223808)))]; tensor var_71_to_fp16 = const()[name = tensor("op_71_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_82_cast = layer_norm(axes = var_82_axes_0, beta = blocks_0_attn_ln_bias_to_fp16, epsilon = var_71_to_fp16, gamma = blocks_0_attn_ln_weight_to_fp16, x = var_53_cast); tensor var_93_to_fp16 = const()[name = tensor("op_93_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2224640)))]; tensor var_94_to_fp16 = const()[name = tensor("op_94_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2519616)))]; tensor q_1_cast = linear(bias = var_94_to_fp16, weight = var_93_to_fp16, x = var_82_cast); tensor var_97_to_fp16 = const()[name = tensor("op_97_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2520448)))]; tensor k_1_bias_0_to_fp16 = const()[name = tensor("k_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2815424)))]; tensor k_1_cast = linear(bias = k_1_bias_0_to_fp16, weight = var_97_to_fp16, x = var_82_cast); tensor var_101_to_fp16 = const()[name = tensor("op_101_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(2816256)))]; tensor var_102_to_fp16 = const()[name = tensor("op_102_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3111232)))]; tensor v_1_cast = linear(bias = var_102_to_fp16, weight = var_101_to_fp16, x = var_82_cast); tensor var_110 = const()[name = tensor("op_110"), val = tensor([1, 1500, 6, -1])]; tensor var_111_cast = reshape(shape = var_110, x = q_1_cast); tensor const_28_to_fp16 = const()[name = tensor("const_28_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_3_cast = mul(x = var_111_cast, y = const_28_to_fp16); tensor var_117 = const()[name = tensor("op_117"), val = tensor([1, 1500, 6, -1])]; tensor var_118_cast = reshape(shape = var_117, x = k_1_cast); tensor const_29_to_fp16 = const()[name = tensor("const_29_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_3_cast = mul(x = var_118_cast, y = const_29_to_fp16); tensor var_124 = const()[name = tensor("op_124"), val = tensor([1, 1500, 6, -1])]; tensor var_125_cast = reshape(shape = var_124, x = v_1_cast); tensor var_126 = const()[name = tensor("op_126"), val = tensor([0, 2, 1, 3])]; tensor qk_1_transpose_x_0 = const()[name = tensor("qk_1_transpose_x_0"), val = tensor(false)]; tensor qk_1_transpose_y_0 = const()[name = tensor("qk_1_transpose_y_0"), val = tensor(false)]; tensor transpose_8_perm_0 = const()[name = tensor("transpose_8_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_9_perm_0 = const()[name = tensor("transpose_9_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_29 = transpose(perm = transpose_9_perm_0, x = k_3_cast); tensor transpose_30 = transpose(perm = transpose_8_perm_0, x = q_3_cast); tensor qk_1_cast = matmul(transpose_x = qk_1_transpose_x_0, transpose_y = qk_1_transpose_y_0, x = transpose_30, y = transpose_29); tensor var_130_cast = softmax(axis = var_65, x = qk_1_cast); tensor var_132_transpose_x_0 = const()[name = tensor("op_132_transpose_x_0"), val = tensor(false)]; tensor var_132_transpose_y_0 = const()[name = tensor("op_132_transpose_y_0"), val = tensor(false)]; tensor transpose_31 = transpose(perm = var_126, x = var_125_cast); tensor var_132_cast = matmul(transpose_x = var_132_transpose_x_0, transpose_y = var_132_transpose_y_0, x = var_130_cast, y = transpose_31); tensor var_133 = const()[name = tensor("op_133"), val = tensor([0, 2, 1, 3])]; tensor concat_0 = const()[name = tensor("concat_0"), val = tensor([1, 1500, 384])]; tensor transpose_28 = transpose(perm = var_133, x = var_132_cast); tensor x_11_cast = reshape(shape = concat_0, x = transpose_28); tensor var_138_to_fp16 = const()[name = tensor("op_138_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3112064)))]; tensor var_139_to_fp16 = const()[name = tensor("op_139_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3407040)))]; tensor var_140_cast = linear(bias = var_139_to_fp16, weight = var_138_to_fp16, x = x_11_cast); tensor x_13_cast = add(x = var_53_cast, y = var_140_cast); tensor var_146_axes_0 = const()[name = tensor("op_146_axes_0"), val = tensor([-1])]; tensor blocks_0_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3407872)))]; tensor blocks_0_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3408704)))]; tensor var_146_cast = layer_norm(axes = var_146_axes_0, beta = blocks_0_mlp_ln_bias_to_fp16, epsilon = var_71_to_fp16, gamma = blocks_0_mlp_ln_weight_to_fp16, x = x_13_cast); tensor var_155_to_fp16 = const()[name = tensor("op_155_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(3409536)))]; tensor var_156_to_fp16 = const()[name = tensor("op_156_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4589248)))]; tensor input_9_cast = linear(bias = var_156_to_fp16, weight = var_155_to_fp16, x = var_146_cast); tensor x_17_mode_0 = const()[name = tensor("x_17_mode_0"), val = tensor("EXACT")]; tensor x_17_cast = gelu(mode = x_17_mode_0, x = input_9_cast); tensor var_161_to_fp16 = const()[name = tensor("op_161_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(4592384)))]; tensor var_162_to_fp16 = const()[name = tensor("op_162_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5772096)))]; tensor var_163_cast = linear(bias = var_162_to_fp16, weight = var_161_to_fp16, x = x_17_cast); tensor x_19_cast = add(x = x_13_cast, y = var_163_cast); tensor var_171 = const()[name = tensor("op_171"), val = tensor(-1)]; tensor var_188_axes_0 = const()[name = tensor("op_188_axes_0"), val = tensor([-1])]; tensor blocks_1_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_1_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5772928)))]; tensor blocks_1_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_1_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5773760)))]; tensor var_177_to_fp16 = const()[name = tensor("op_177_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_188_cast = layer_norm(axes = var_188_axes_0, beta = blocks_1_attn_ln_bias_to_fp16, epsilon = var_177_to_fp16, gamma = blocks_1_attn_ln_weight_to_fp16, x = x_19_cast); tensor var_199_to_fp16 = const()[name = tensor("op_199_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(5774592)))]; tensor var_200_to_fp16 = const()[name = tensor("op_200_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6069568)))]; tensor q_5_cast = linear(bias = var_200_to_fp16, weight = var_199_to_fp16, x = var_188_cast); tensor var_203_to_fp16 = const()[name = tensor("op_203_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6070400)))]; tensor k_5_bias_0_to_fp16 = const()[name = tensor("k_5_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6365376)))]; tensor k_5_cast = linear(bias = k_5_bias_0_to_fp16, weight = var_203_to_fp16, x = var_188_cast); tensor var_207_to_fp16 = const()[name = tensor("op_207_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6366208)))]; tensor var_208_to_fp16 = const()[name = tensor("op_208_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6661184)))]; tensor v_5_cast = linear(bias = var_208_to_fp16, weight = var_207_to_fp16, x = var_188_cast); tensor var_216 = const()[name = tensor("op_216"), val = tensor([1, 1500, 6, -1])]; tensor var_217_cast = reshape(shape = var_216, x = q_5_cast); tensor const_30_to_fp16 = const()[name = tensor("const_30_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_7_cast = mul(x = var_217_cast, y = const_30_to_fp16); tensor var_223 = const()[name = tensor("op_223"), val = tensor([1, 1500, 6, -1])]; tensor var_224_cast = reshape(shape = var_223, x = k_5_cast); tensor const_31_to_fp16 = const()[name = tensor("const_31_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_7_cast = mul(x = var_224_cast, y = const_31_to_fp16); tensor var_230 = const()[name = tensor("op_230"), val = tensor([1, 1500, 6, -1])]; tensor var_231_cast = reshape(shape = var_230, x = v_5_cast); tensor var_232 = const()[name = tensor("op_232"), val = tensor([0, 2, 1, 3])]; tensor qk_3_transpose_x_0 = const()[name = tensor("qk_3_transpose_x_0"), val = tensor(false)]; tensor qk_3_transpose_y_0 = const()[name = tensor("qk_3_transpose_y_0"), val = tensor(false)]; tensor transpose_10_perm_0 = const()[name = tensor("transpose_10_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_11_perm_0 = const()[name = tensor("transpose_11_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_25 = transpose(perm = transpose_11_perm_0, x = k_7_cast); tensor transpose_26 = transpose(perm = transpose_10_perm_0, x = q_7_cast); tensor qk_3_cast = matmul(transpose_x = qk_3_transpose_x_0, transpose_y = qk_3_transpose_y_0, x = transpose_26, y = transpose_25); tensor var_236_cast = softmax(axis = var_171, x = qk_3_cast); tensor var_238_transpose_x_0 = const()[name = tensor("op_238_transpose_x_0"), val = tensor(false)]; tensor var_238_transpose_y_0 = const()[name = tensor("op_238_transpose_y_0"), val = tensor(false)]; tensor transpose_27 = transpose(perm = var_232, x = var_231_cast); tensor var_238_cast = matmul(transpose_x = var_238_transpose_x_0, transpose_y = var_238_transpose_y_0, x = var_236_cast, y = transpose_27); tensor var_239 = const()[name = tensor("op_239"), val = tensor([0, 2, 1, 3])]; tensor concat_1 = const()[name = tensor("concat_1"), val = tensor([1, 1500, 384])]; tensor transpose_24 = transpose(perm = var_239, x = var_238_cast); tensor x_23_cast = reshape(shape = concat_1, x = transpose_24); tensor var_244_to_fp16 = const()[name = tensor("op_244_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6662016)))]; tensor var_245_to_fp16 = const()[name = tensor("op_245_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6956992)))]; tensor var_246_cast = linear(bias = var_245_to_fp16, weight = var_244_to_fp16, x = x_23_cast); tensor x_25_cast = add(x = x_19_cast, y = var_246_cast); tensor var_252_axes_0 = const()[name = tensor("op_252_axes_0"), val = tensor([-1])]; tensor blocks_1_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6957824)))]; tensor blocks_1_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6958656)))]; tensor var_252_cast = layer_norm(axes = var_252_axes_0, beta = blocks_1_mlp_ln_bias_to_fp16, epsilon = var_177_to_fp16, gamma = blocks_1_mlp_ln_weight_to_fp16, x = x_25_cast); tensor var_261_to_fp16 = const()[name = tensor("op_261_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6959488)))]; tensor var_262_to_fp16 = const()[name = tensor("op_262_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8139200)))]; tensor input_17_cast = linear(bias = var_262_to_fp16, weight = var_261_to_fp16, x = var_252_cast); tensor x_29_mode_0 = const()[name = tensor("x_29_mode_0"), val = tensor("EXACT")]; tensor x_29_cast = gelu(mode = x_29_mode_0, x = input_17_cast); tensor var_267_to_fp16 = const()[name = tensor("op_267_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(8142336)))]; tensor var_268_to_fp16 = const()[name = tensor("op_268_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9322048)))]; tensor var_269_cast = linear(bias = var_268_to_fp16, weight = var_267_to_fp16, x = x_29_cast); tensor x_31_cast = add(x = x_25_cast, y = var_269_cast); tensor var_277 = const()[name = tensor("op_277"), val = tensor(-1)]; tensor var_294_axes_0 = const()[name = tensor("op_294_axes_0"), val = tensor([-1])]; tensor blocks_2_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_2_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9322880)))]; tensor blocks_2_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_2_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9323712)))]; tensor var_283_to_fp16 = const()[name = tensor("op_283_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_294_cast = layer_norm(axes = var_294_axes_0, beta = blocks_2_attn_ln_bias_to_fp16, epsilon = var_283_to_fp16, gamma = blocks_2_attn_ln_weight_to_fp16, x = x_31_cast); tensor var_305_to_fp16 = const()[name = tensor("op_305_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9324544)))]; tensor var_306_to_fp16 = const()[name = tensor("op_306_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9619520)))]; tensor q_9_cast = linear(bias = var_306_to_fp16, weight = var_305_to_fp16, x = var_294_cast); tensor var_309_to_fp16 = const()[name = tensor("op_309_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9620352)))]; tensor k_9_bias_0_to_fp16 = const()[name = tensor("k_9_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9915328)))]; tensor k_9_cast = linear(bias = k_9_bias_0_to_fp16, weight = var_309_to_fp16, x = var_294_cast); tensor var_313_to_fp16 = const()[name = tensor("op_313_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9916160)))]; tensor var_314_to_fp16 = const()[name = tensor("op_314_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10211136)))]; tensor v_9_cast = linear(bias = var_314_to_fp16, weight = var_313_to_fp16, x = var_294_cast); tensor var_322 = const()[name = tensor("op_322"), val = tensor([1, 1500, 6, -1])]; tensor var_323_cast = reshape(shape = var_322, x = q_9_cast); tensor const_32_to_fp16 = const()[name = tensor("const_32_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_11_cast = mul(x = var_323_cast, y = const_32_to_fp16); tensor var_329 = const()[name = tensor("op_329"), val = tensor([1, 1500, 6, -1])]; tensor var_330_cast = reshape(shape = var_329, x = k_9_cast); tensor const_33_to_fp16 = const()[name = tensor("const_33_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_11_cast = mul(x = var_330_cast, y = const_33_to_fp16); tensor var_336 = const()[name = tensor("op_336"), val = tensor([1, 1500, 6, -1])]; tensor var_337_cast = reshape(shape = var_336, x = v_9_cast); tensor var_338 = const()[name = tensor("op_338"), val = tensor([0, 2, 1, 3])]; tensor qk_5_transpose_x_0 = const()[name = tensor("qk_5_transpose_x_0"), val = tensor(false)]; tensor qk_5_transpose_y_0 = const()[name = tensor("qk_5_transpose_y_0"), val = tensor(false)]; tensor transpose_12_perm_0 = const()[name = tensor("transpose_12_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_13_perm_0 = const()[name = tensor("transpose_13_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_21 = transpose(perm = transpose_13_perm_0, x = k_11_cast); tensor transpose_22 = transpose(perm = transpose_12_perm_0, x = q_11_cast); tensor qk_5_cast = matmul(transpose_x = qk_5_transpose_x_0, transpose_y = qk_5_transpose_y_0, x = transpose_22, y = transpose_21); tensor var_342_cast = softmax(axis = var_277, x = qk_5_cast); tensor var_344_transpose_x_0 = const()[name = tensor("op_344_transpose_x_0"), val = tensor(false)]; tensor var_344_transpose_y_0 = const()[name = tensor("op_344_transpose_y_0"), val = tensor(false)]; tensor transpose_23 = transpose(perm = var_338, x = var_337_cast); tensor var_344_cast = matmul(transpose_x = var_344_transpose_x_0, transpose_y = var_344_transpose_y_0, x = var_342_cast, y = transpose_23); tensor var_345 = const()[name = tensor("op_345"), val = tensor([0, 2, 1, 3])]; tensor concat_2 = const()[name = tensor("concat_2"), val = tensor([1, 1500, 384])]; tensor transpose_20 = transpose(perm = var_345, x = var_344_cast); tensor x_35_cast = reshape(shape = concat_2, x = transpose_20); tensor var_350_to_fp16 = const()[name = tensor("op_350_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10211968)))]; tensor var_351_to_fp16 = const()[name = tensor("op_351_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10506944)))]; tensor var_352_cast = linear(bias = var_351_to_fp16, weight = var_350_to_fp16, x = x_35_cast); tensor x_37_cast = add(x = x_31_cast, y = var_352_cast); tensor var_358_axes_0 = const()[name = tensor("op_358_axes_0"), val = tensor([-1])]; tensor blocks_2_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10507776)))]; tensor blocks_2_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10508608)))]; tensor var_358_cast = layer_norm(axes = var_358_axes_0, beta = blocks_2_mlp_ln_bias_to_fp16, epsilon = var_283_to_fp16, gamma = blocks_2_mlp_ln_weight_to_fp16, x = x_37_cast); tensor var_367_to_fp16 = const()[name = tensor("op_367_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(10509440)))]; tensor var_368_to_fp16 = const()[name = tensor("op_368_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11689152)))]; tensor input_25_cast = linear(bias = var_368_to_fp16, weight = var_367_to_fp16, x = var_358_cast); tensor x_41_mode_0 = const()[name = tensor("x_41_mode_0"), val = tensor("EXACT")]; tensor x_41_cast = gelu(mode = x_41_mode_0, x = input_25_cast); tensor var_373_to_fp16 = const()[name = tensor("op_373_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11692288)))]; tensor var_374_to_fp16 = const()[name = tensor("op_374_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12872000)))]; tensor var_375_cast = linear(bias = var_374_to_fp16, weight = var_373_to_fp16, x = x_41_cast); tensor x_43_cast = add(x = x_37_cast, y = var_375_cast); tensor var_383 = const()[name = tensor("op_383"), val = tensor(-1)]; tensor var_400_axes_0 = const()[name = tensor("op_400_axes_0"), val = tensor([-1])]; tensor blocks_3_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_3_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12872832)))]; tensor blocks_3_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_3_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12873664)))]; tensor var_389_to_fp16 = const()[name = tensor("op_389_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_400_cast = layer_norm(axes = var_400_axes_0, beta = blocks_3_attn_ln_bias_to_fp16, epsilon = var_389_to_fp16, gamma = blocks_3_attn_ln_weight_to_fp16, x = x_43_cast); tensor var_411_to_fp16 = const()[name = tensor("op_411_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(12874496)))]; tensor var_412_to_fp16 = const()[name = tensor("op_412_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13169472)))]; tensor q_13_cast = linear(bias = var_412_to_fp16, weight = var_411_to_fp16, x = var_400_cast); tensor var_415_to_fp16 = const()[name = tensor("op_415_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13170304)))]; tensor k_13_bias_0_to_fp16 = const()[name = tensor("k_13_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13465280)))]; tensor k_13_cast = linear(bias = k_13_bias_0_to_fp16, weight = var_415_to_fp16, x = var_400_cast); tensor var_419_to_fp16 = const()[name = tensor("op_419_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13466112)))]; tensor var_420_to_fp16 = const()[name = tensor("op_420_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13761088)))]; tensor v_13_cast = linear(bias = var_420_to_fp16, weight = var_419_to_fp16, x = var_400_cast); tensor var_428 = const()[name = tensor("op_428"), val = tensor([1, 1500, 6, -1])]; tensor var_429_cast = reshape(shape = var_428, x = q_13_cast); tensor const_34_to_fp16 = const()[name = tensor("const_34_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_cast = mul(x = var_429_cast, y = const_34_to_fp16); tensor var_435 = const()[name = tensor("op_435"), val = tensor([1, 1500, 6, -1])]; tensor var_436_cast = reshape(shape = var_435, x = k_13_cast); tensor const_35_to_fp16 = const()[name = tensor("const_35_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_cast = mul(x = var_436_cast, y = const_35_to_fp16); tensor var_442 = const()[name = tensor("op_442"), val = tensor([1, 1500, 6, -1])]; tensor var_443_cast = reshape(shape = var_442, x = v_13_cast); tensor var_444 = const()[name = tensor("op_444"), val = tensor([0, 2, 1, 3])]; tensor qk_transpose_x_0 = const()[name = tensor("qk_transpose_x_0"), val = tensor(false)]; tensor qk_transpose_y_0 = const()[name = tensor("qk_transpose_y_0"), val = tensor(false)]; tensor transpose_14_perm_0 = const()[name = tensor("transpose_14_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_15_perm_0 = const()[name = tensor("transpose_15_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_17 = transpose(perm = transpose_15_perm_0, x = k_cast); tensor transpose_18 = transpose(perm = transpose_14_perm_0, x = q_cast); tensor qk_cast = matmul(transpose_x = qk_transpose_x_0, transpose_y = qk_transpose_y_0, x = transpose_18, y = transpose_17); tensor var_448_cast = softmax(axis = var_383, x = qk_cast); tensor var_450_transpose_x_0 = const()[name = tensor("op_450_transpose_x_0"), val = tensor(false)]; tensor var_450_transpose_y_0 = const()[name = tensor("op_450_transpose_y_0"), val = tensor(false)]; tensor transpose_19 = transpose(perm = var_444, x = var_443_cast); tensor var_450_cast = matmul(transpose_x = var_450_transpose_x_0, transpose_y = var_450_transpose_y_0, x = var_448_cast, y = transpose_19); tensor var_451 = const()[name = tensor("op_451"), val = tensor([0, 2, 1, 3])]; tensor concat_3 = const()[name = tensor("concat_3"), val = tensor([1, 1500, 384])]; tensor transpose_16 = transpose(perm = var_451, x = var_450_cast); tensor x_47_cast = reshape(shape = concat_3, x = transpose_16); tensor var_456_to_fp16 = const()[name = tensor("op_456_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(13761920)))]; tensor var_457_to_fp16 = const()[name = tensor("op_457_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14056896)))]; tensor var_458_cast = linear(bias = var_457_to_fp16, weight = var_456_to_fp16, x = x_47_cast); tensor x_49_cast = add(x = x_43_cast, y = var_458_cast); tensor var_464_axes_0 = const()[name = tensor("op_464_axes_0"), val = tensor([-1])]; tensor blocks_3_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14057728)))]; tensor blocks_3_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14058560)))]; tensor var_464_cast = layer_norm(axes = var_464_axes_0, beta = blocks_3_mlp_ln_bias_to_fp16, epsilon = var_389_to_fp16, gamma = blocks_3_mlp_ln_weight_to_fp16, x = x_49_cast); tensor var_473_to_fp16 = const()[name = tensor("op_473_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14059392)))]; tensor var_474_to_fp16 = const()[name = tensor("op_474_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15239104)))]; tensor input_33_cast = linear(bias = var_474_to_fp16, weight = var_473_to_fp16, x = var_464_cast); tensor x_53_mode_0 = const()[name = tensor("x_53_mode_0"), val = tensor("EXACT")]; tensor x_53_cast = gelu(mode = x_53_mode_0, x = input_33_cast); tensor var_479_to_fp16 = const()[name = tensor("op_479_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(15242240)))]; tensor var_480_to_fp16 = const()[name = tensor("op_480_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16421952)))]; tensor var_481_cast = linear(bias = var_480_to_fp16, weight = var_479_to_fp16, x = x_53_cast); tensor x_cast = add(x = x_49_cast, y = var_481_cast); tensor var_494_axes_0 = const()[name = tensor("op_494_axes_0"), val = tensor([-1])]; tensor ln_post_weight_to_fp16 = const()[name = tensor("ln_post_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16422784)))]; tensor ln_post_bias_to_fp16 = const()[name = tensor("ln_post_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16423616)))]; tensor var_485_to_fp16 = const()[name = tensor("op_485_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_494_cast = layer_norm(axes = var_494_axes_0, beta = ln_post_bias_to_fp16, epsilon = var_485_to_fp16, gamma = ln_post_weight_to_fp16, x = x_cast); tensor var_494_cast_to_fp32_dtype_0 = const()[name = tensor("op_494_cast_to_fp32_dtype_0"), val = tensor("fp32")]; tensor output = cast(dtype = var_494_cast_to_fp32_dtype_0, x = var_494_cast); } -> (output); }