diff --git "a/ggml-medium.en-encoder.mlmodelc/model.mil" "b/ggml-medium.en-encoder.mlmodelc/model.mil" new file mode 100644--- /dev/null +++ "b/ggml-medium.en-encoder.mlmodelc/model.mil" @@ -0,0 +1,1455 @@ +program(1.0) +[buildInfo = dict, tensor>({{"coremlc-component-MIL", "4.28.4"}, {"coremlc-version", "1436.100.10"}})] +{ + func main(tensor logmel_data) { + tensor var_56 = const()[name = tensor("op_56"), val = tensor(1)]; + tensor var_64 = const()[name = tensor("op_64"), val = tensor([1])]; + tensor var_66 = const()[name = tensor("op_66"), val = tensor([1])]; + tensor var_68_pad_type_0 = const()[name = tensor("op_68_pad_type_0"), val = tensor("custom")]; + tensor var_68_pad_0 = const()[name = tensor("op_68_pad_0"), val = tensor([1, 1])]; + tensor logmel_data_to_fp16_dtype_0 = const()[name = tensor("logmel_data_to_fp16_dtype_0"), val = tensor("fp16")]; + tensor weight_3_to_fp16 = const()[name = tensor("weight_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; + tensor bias_3_to_fp16 = const()[name = tensor("bias_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(491648)))]; + tensor cast_727 = cast(dtype = logmel_data_to_fp16_dtype_0, x = logmel_data); + tensor var_68_cast = conv(bias = bias_3_to_fp16, dilations = var_66, groups = var_56, pad = var_68_pad_0, pad_type = var_68_pad_type_0, strides = var_64, weight = weight_3_to_fp16, x = cast_727); + tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; + tensor input_1_cast = gelu(mode = input_1_mode_0, x = var_68_cast); + tensor var_72 = const()[name = tensor("op_72"), val = tensor(1)]; + tensor var_81 = const()[name = tensor("op_81"), val = tensor([2])]; + tensor var_83 = const()[name = tensor("op_83"), val = tensor([1])]; + tensor var_85_pad_type_0 = const()[name = tensor("op_85_pad_type_0"), val = tensor("custom")]; + tensor var_85_pad_0 = const()[name = tensor("op_85_pad_0"), val = tensor([1, 1])]; + tensor weight_7_to_fp16 = const()[name = tensor("weight_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(493760)))]; + tensor bias_7_to_fp16 = const()[name = tensor("bias_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6785280)))]; + tensor var_85_cast = conv(bias = bias_7_to_fp16, dilations = var_83, groups = var_72, pad = var_85_pad_0, pad_type = var_85_pad_type_0, strides = var_81, weight = weight_7_to_fp16, x = input_1_cast); + tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; + tensor x_3_cast = gelu(mode = x_3_mode_0, x = var_85_cast); + tensor var_90 = const()[name = tensor("op_90"), val = tensor([0, 2, 1])]; + tensor positional_embedding_to_fp16 = const()[name = tensor("positional_embedding_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6787392)))]; + tensor transpose_192 = transpose(perm = var_90, x = x_3_cast); + tensor var_93_cast = add(x = transpose_192, y = positional_embedding_to_fp16); + tensor var_106 = const()[name = tensor("op_106"), val = tensor(-1)]; + tensor var_123_axes_0 = const()[name = tensor("op_123_axes_0"), val = tensor([-1])]; + tensor blocks_0_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_0_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9859456)))]; + tensor blocks_0_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_0_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9861568)))]; + tensor var_112_to_fp16 = const()[name = tensor("op_112_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_123_cast = layer_norm(axes = var_123_axes_0, beta = blocks_0_attn_ln_bias_to_fp16, epsilon = var_112_to_fp16, gamma = blocks_0_attn_ln_weight_to_fp16, x = var_93_cast); + tensor var_134_to_fp16 = const()[name = tensor("op_134_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9863680)))]; + tensor var_135_to_fp16 = const()[name = tensor("op_135_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11960896)))]; + tensor q_1_cast = linear(bias = var_135_to_fp16, weight = var_134_to_fp16, x = var_123_cast); + tensor var_138_to_fp16 = const()[name = tensor("op_138_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11963008)))]; + tensor k_1_bias_0_to_fp16 = const()[name = tensor("k_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14060224)))]; + tensor k_1_cast = linear(bias = k_1_bias_0_to_fp16, weight = var_138_to_fp16, x = var_123_cast); + tensor var_142_to_fp16 = const()[name = tensor("op_142_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14062336)))]; + tensor var_143_to_fp16 = const()[name = tensor("op_143_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16159552)))]; + tensor v_1_cast = linear(bias = var_143_to_fp16, weight = var_142_to_fp16, x = var_123_cast); + tensor var_151 = const()[name = tensor("op_151"), val = tensor([1, 1500, 16, -1])]; + tensor var_152_cast = reshape(shape = var_151, x = q_1_cast); + tensor const_168_to_fp16 = const()[name = tensor("const_168_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_3_cast = mul(x = var_152_cast, y = const_168_to_fp16); + tensor var_158 = const()[name = tensor("op_158"), val = tensor([1, 1500, 16, -1])]; + tensor var_159_cast = reshape(shape = var_158, x = k_1_cast); + tensor const_169_to_fp16 = const()[name = tensor("const_169_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_3_cast = mul(x = var_159_cast, y = const_169_to_fp16); + tensor var_165 = const()[name = tensor("op_165"), val = tensor([1, 1500, 16, -1])]; + tensor var_166_cast = reshape(shape = var_165, x = v_1_cast); + tensor var_167 = const()[name = tensor("op_167"), val = tensor([0, 2, 1, 3])]; + tensor qk_1_transpose_x_0 = const()[name = tensor("qk_1_transpose_x_0"), val = tensor(false)]; + tensor qk_1_transpose_y_0 = const()[name = tensor("qk_1_transpose_y_0"), val = tensor(false)]; + tensor transpose_48_perm_0 = const()[name = tensor("transpose_48_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_49_perm_0 = const()[name = tensor("transpose_49_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_189 = transpose(perm = transpose_49_perm_0, x = k_3_cast); + tensor transpose_190 = transpose(perm = transpose_48_perm_0, x = q_3_cast); + tensor qk_1_cast = matmul(transpose_x = qk_1_transpose_x_0, transpose_y = qk_1_transpose_y_0, x = transpose_190, y = transpose_189); + tensor var_171_cast = softmax(axis = var_106, x = qk_1_cast); + tensor var_173_transpose_x_0 = const()[name = tensor("op_173_transpose_x_0"), val = tensor(false)]; + tensor var_173_transpose_y_0 = const()[name = tensor("op_173_transpose_y_0"), val = tensor(false)]; + tensor transpose_191 = transpose(perm = var_167, x = var_166_cast); + tensor var_173_cast = matmul(transpose_x = var_173_transpose_x_0, transpose_y = var_173_transpose_y_0, x = var_171_cast, y = transpose_191); + tensor var_174 = const()[name = tensor("op_174"), val = tensor([0, 2, 1, 3])]; + tensor concat_0 = const()[name = tensor("concat_0"), val = tensor([1, 1500, 1024])]; + tensor transpose_188 = transpose(perm = var_174, x = var_173_cast); + tensor x_11_cast = reshape(shape = concat_0, x = transpose_188); + tensor var_179_to_fp16 = const()[name = tensor("op_179_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16161664)))]; + tensor var_180_to_fp16 = const()[name = tensor("op_180_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18258880)))]; + tensor var_181_cast = linear(bias = var_180_to_fp16, weight = var_179_to_fp16, x = x_11_cast); + tensor x_13_cast = add(x = var_93_cast, y = var_181_cast); + tensor var_187_axes_0 = const()[name = tensor("op_187_axes_0"), val = tensor([-1])]; + tensor blocks_0_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18260992)))]; + tensor blocks_0_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18263104)))]; + tensor var_187_cast = layer_norm(axes = var_187_axes_0, beta = blocks_0_mlp_ln_bias_to_fp16, epsilon = var_112_to_fp16, gamma = blocks_0_mlp_ln_weight_to_fp16, x = x_13_cast); + tensor var_196_to_fp16 = const()[name = tensor("op_196_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18265216)))]; + tensor var_197_to_fp16 = const()[name = tensor("op_197_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26653888)))]; + tensor input_9_cast = linear(bias = var_197_to_fp16, weight = var_196_to_fp16, x = var_187_cast); + tensor x_17_mode_0 = const()[name = tensor("x_17_mode_0"), val = tensor("EXACT")]; + tensor x_17_cast = gelu(mode = x_17_mode_0, x = input_9_cast); + tensor var_202_to_fp16 = const()[name = tensor("op_202_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26662144)))]; + tensor var_203_to_fp16 = const()[name = tensor("op_203_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35050816)))]; + tensor var_204_cast = linear(bias = var_203_to_fp16, weight = var_202_to_fp16, x = x_17_cast); + tensor x_19_cast = add(x = x_13_cast, y = var_204_cast); + tensor var_213 = const()[name = tensor("op_213"), val = tensor(-1)]; + tensor var_230_axes_0 = const()[name = tensor("op_230_axes_0"), val = tensor([-1])]; + tensor blocks_1_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_1_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35052928)))]; + tensor blocks_1_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_1_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35055040)))]; + tensor var_219_to_fp16 = const()[name = tensor("op_219_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_230_cast = layer_norm(axes = var_230_axes_0, beta = blocks_1_attn_ln_bias_to_fp16, epsilon = var_219_to_fp16, gamma = blocks_1_attn_ln_weight_to_fp16, x = x_19_cast); + tensor var_241_to_fp16 = const()[name = tensor("op_241_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35057152)))]; + tensor var_242_to_fp16 = const()[name = tensor("op_242_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37154368)))]; + tensor q_5_cast = linear(bias = var_242_to_fp16, weight = var_241_to_fp16, x = var_230_cast); + tensor var_245_to_fp16 = const()[name = tensor("op_245_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37156480)))]; + tensor k_5_bias_0_to_fp16 = const()[name = tensor("k_5_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39253696)))]; + tensor k_5_cast = linear(bias = k_5_bias_0_to_fp16, weight = var_245_to_fp16, x = var_230_cast); + tensor var_249_to_fp16 = const()[name = tensor("op_249_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39255808)))]; + tensor var_250_to_fp16 = const()[name = tensor("op_250_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41353024)))]; + tensor v_5_cast = linear(bias = var_250_to_fp16, weight = var_249_to_fp16, x = var_230_cast); + tensor var_258 = const()[name = tensor("op_258"), val = tensor([1, 1500, 16, -1])]; + tensor var_259_cast = reshape(shape = var_258, x = q_5_cast); + tensor const_170_to_fp16 = const()[name = tensor("const_170_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_7_cast = mul(x = var_259_cast, y = const_170_to_fp16); + tensor var_265 = const()[name = tensor("op_265"), val = tensor([1, 1500, 16, -1])]; + tensor var_266_cast = reshape(shape = var_265, x = k_5_cast); + tensor const_171_to_fp16 = const()[name = tensor("const_171_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_7_cast = mul(x = var_266_cast, y = const_171_to_fp16); + tensor var_272 = const()[name = tensor("op_272"), val = tensor([1, 1500, 16, -1])]; + tensor var_273_cast = reshape(shape = var_272, x = v_5_cast); + tensor var_274 = const()[name = tensor("op_274"), val = tensor([0, 2, 1, 3])]; + tensor qk_3_transpose_x_0 = const()[name = tensor("qk_3_transpose_x_0"), val = tensor(false)]; + tensor qk_3_transpose_y_0 = const()[name = tensor("qk_3_transpose_y_0"), val = tensor(false)]; + tensor transpose_50_perm_0 = const()[name = tensor("transpose_50_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_51_perm_0 = const()[name = tensor("transpose_51_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_185 = transpose(perm = transpose_51_perm_0, x = k_7_cast); + tensor transpose_186 = transpose(perm = transpose_50_perm_0, x = q_7_cast); + tensor qk_3_cast = matmul(transpose_x = qk_3_transpose_x_0, transpose_y = qk_3_transpose_y_0, x = transpose_186, y = transpose_185); + tensor var_278_cast = softmax(axis = var_213, x = qk_3_cast); + tensor var_280_transpose_x_0 = const()[name = tensor("op_280_transpose_x_0"), val = tensor(false)]; + tensor var_280_transpose_y_0 = const()[name = tensor("op_280_transpose_y_0"), val = tensor(false)]; + tensor transpose_187 = transpose(perm = var_274, x = var_273_cast); + tensor var_280_cast = matmul(transpose_x = var_280_transpose_x_0, transpose_y = var_280_transpose_y_0, x = var_278_cast, y = transpose_187); + tensor var_281 = const()[name = tensor("op_281"), val = tensor([0, 2, 1, 3])]; + tensor concat_1 = const()[name = tensor("concat_1"), val = tensor([1, 1500, 1024])]; + tensor transpose_184 = transpose(perm = var_281, x = var_280_cast); + tensor x_23_cast = reshape(shape = concat_1, x = transpose_184); + tensor var_286_to_fp16 = const()[name = tensor("op_286_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41355136)))]; + tensor var_287_to_fp16 = const()[name = tensor("op_287_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43452352)))]; + tensor var_288_cast = linear(bias = var_287_to_fp16, weight = var_286_to_fp16, x = x_23_cast); + tensor x_25_cast = add(x = x_19_cast, y = var_288_cast); + tensor var_294_axes_0 = const()[name = tensor("op_294_axes_0"), val = tensor([-1])]; + tensor blocks_1_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43454464)))]; + tensor blocks_1_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43456576)))]; + tensor var_294_cast = layer_norm(axes = var_294_axes_0, beta = blocks_1_mlp_ln_bias_to_fp16, epsilon = var_219_to_fp16, gamma = blocks_1_mlp_ln_weight_to_fp16, x = x_25_cast); + tensor var_303_to_fp16 = const()[name = tensor("op_303_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43458688)))]; + tensor var_304_to_fp16 = const()[name = tensor("op_304_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51847360)))]; + tensor input_17_cast = linear(bias = var_304_to_fp16, weight = var_303_to_fp16, x = var_294_cast); + tensor x_29_mode_0 = const()[name = tensor("x_29_mode_0"), val = tensor("EXACT")]; + tensor x_29_cast = gelu(mode = x_29_mode_0, x = input_17_cast); + tensor var_309_to_fp16 = const()[name = tensor("op_309_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51855616)))]; + tensor var_310_to_fp16 = const()[name = tensor("op_310_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60244288)))]; + tensor var_311_cast = linear(bias = var_310_to_fp16, weight = var_309_to_fp16, x = x_29_cast); + tensor x_31_cast = add(x = x_25_cast, y = var_311_cast); + tensor var_320 = const()[name = tensor("op_320"), val = tensor(-1)]; + tensor var_337_axes_0 = const()[name = tensor("op_337_axes_0"), val = tensor([-1])]; + tensor blocks_2_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_2_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60246400)))]; + tensor blocks_2_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_2_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60248512)))]; + tensor var_326_to_fp16 = const()[name = tensor("op_326_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_337_cast = layer_norm(axes = var_337_axes_0, beta = blocks_2_attn_ln_bias_to_fp16, epsilon = var_326_to_fp16, gamma = blocks_2_attn_ln_weight_to_fp16, x = x_31_cast); + tensor var_348_to_fp16 = const()[name = tensor("op_348_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60250624)))]; + tensor var_349_to_fp16 = const()[name = tensor("op_349_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(62347840)))]; + tensor q_9_cast = linear(bias = var_349_to_fp16, weight = var_348_to_fp16, x = var_337_cast); + tensor var_352_to_fp16 = const()[name = tensor("op_352_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(62349952)))]; + tensor k_9_bias_0_to_fp16 = const()[name = tensor("k_9_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64447168)))]; + tensor k_9_cast = linear(bias = k_9_bias_0_to_fp16, weight = var_352_to_fp16, x = var_337_cast); + tensor var_356_to_fp16 = const()[name = tensor("op_356_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64449280)))]; + tensor var_357_to_fp16 = const()[name = tensor("op_357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66546496)))]; + tensor v_9_cast = linear(bias = var_357_to_fp16, weight = var_356_to_fp16, x = var_337_cast); + tensor var_365 = const()[name = tensor("op_365"), val = tensor([1, 1500, 16, -1])]; + tensor var_366_cast = reshape(shape = var_365, x = q_9_cast); + tensor const_172_to_fp16 = const()[name = tensor("const_172_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_11_cast = mul(x = var_366_cast, y = const_172_to_fp16); + tensor var_372 = const()[name = tensor("op_372"), val = tensor([1, 1500, 16, -1])]; + tensor var_373_cast = reshape(shape = var_372, x = k_9_cast); + tensor const_173_to_fp16 = const()[name = tensor("const_173_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_11_cast = mul(x = var_373_cast, y = const_173_to_fp16); + tensor var_379 = const()[name = tensor("op_379"), val = tensor([1, 1500, 16, -1])]; + tensor var_380_cast = reshape(shape = var_379, x = v_9_cast); + tensor var_381 = const()[name = tensor("op_381"), val = tensor([0, 2, 1, 3])]; + tensor qk_5_transpose_x_0 = const()[name = tensor("qk_5_transpose_x_0"), val = tensor(false)]; + tensor qk_5_transpose_y_0 = const()[name = tensor("qk_5_transpose_y_0"), val = tensor(false)]; + tensor transpose_52_perm_0 = const()[name = tensor("transpose_52_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_53_perm_0 = const()[name = tensor("transpose_53_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_181 = transpose(perm = transpose_53_perm_0, x = k_11_cast); + tensor transpose_182 = transpose(perm = transpose_52_perm_0, x = q_11_cast); + tensor qk_5_cast = matmul(transpose_x = qk_5_transpose_x_0, transpose_y = qk_5_transpose_y_0, x = transpose_182, y = transpose_181); + tensor var_385_cast = softmax(axis = var_320, x = qk_5_cast); + tensor var_387_transpose_x_0 = const()[name = tensor("op_387_transpose_x_0"), val = tensor(false)]; + tensor var_387_transpose_y_0 = const()[name = tensor("op_387_transpose_y_0"), val = tensor(false)]; + tensor transpose_183 = transpose(perm = var_381, x = var_380_cast); + tensor var_387_cast = matmul(transpose_x = var_387_transpose_x_0, transpose_y = var_387_transpose_y_0, x = var_385_cast, y = transpose_183); + tensor var_388 = const()[name = tensor("op_388"), val = tensor([0, 2, 1, 3])]; + tensor concat_2 = const()[name = tensor("concat_2"), val = tensor([1, 1500, 1024])]; + tensor transpose_180 = transpose(perm = var_388, x = var_387_cast); + tensor x_35_cast = reshape(shape = concat_2, x = transpose_180); + tensor var_393_to_fp16 = const()[name = tensor("op_393_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66548608)))]; + tensor var_394_to_fp16 = const()[name = tensor("op_394_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68645824)))]; + tensor var_395_cast = linear(bias = var_394_to_fp16, weight = var_393_to_fp16, x = x_35_cast); + tensor x_37_cast = add(x = x_31_cast, y = var_395_cast); + tensor var_401_axes_0 = const()[name = tensor("op_401_axes_0"), val = tensor([-1])]; + tensor blocks_2_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68647936)))]; + tensor blocks_2_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68650048)))]; + tensor var_401_cast = layer_norm(axes = var_401_axes_0, beta = blocks_2_mlp_ln_bias_to_fp16, epsilon = var_326_to_fp16, gamma = blocks_2_mlp_ln_weight_to_fp16, x = x_37_cast); + tensor var_410_to_fp16 = const()[name = tensor("op_410_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68652160)))]; + tensor var_411_to_fp16 = const()[name = tensor("op_411_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77040832)))]; + tensor input_25_cast = linear(bias = var_411_to_fp16, weight = var_410_to_fp16, x = var_401_cast); + tensor x_41_mode_0 = const()[name = tensor("x_41_mode_0"), val = tensor("EXACT")]; + tensor x_41_cast = gelu(mode = x_41_mode_0, x = input_25_cast); + tensor var_416_to_fp16 = const()[name = tensor("op_416_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77049088)))]; + tensor var_417_to_fp16 = const()[name = tensor("op_417_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85437760)))]; + tensor var_418_cast = linear(bias = var_417_to_fp16, weight = var_416_to_fp16, x = x_41_cast); + tensor x_43_cast = add(x = x_37_cast, y = var_418_cast); + tensor var_427 = const()[name = tensor("op_427"), val = tensor(-1)]; + tensor var_444_axes_0 = const()[name = tensor("op_444_axes_0"), val = tensor([-1])]; + tensor blocks_3_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_3_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85439872)))]; + tensor blocks_3_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_3_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85441984)))]; + tensor var_433_to_fp16 = const()[name = tensor("op_433_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_444_cast = layer_norm(axes = var_444_axes_0, beta = blocks_3_attn_ln_bias_to_fp16, epsilon = var_433_to_fp16, gamma = blocks_3_attn_ln_weight_to_fp16, x = x_43_cast); + tensor var_455_to_fp16 = const()[name = tensor("op_455_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85444096)))]; + tensor var_456_to_fp16 = const()[name = tensor("op_456_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(87541312)))]; + tensor q_13_cast = linear(bias = var_456_to_fp16, weight = var_455_to_fp16, x = var_444_cast); + tensor var_459_to_fp16 = const()[name = tensor("op_459_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(87543424)))]; + tensor k_13_bias_0_to_fp16 = const()[name = tensor("k_13_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89640640)))]; + tensor k_13_cast = linear(bias = k_13_bias_0_to_fp16, weight = var_459_to_fp16, x = var_444_cast); + tensor var_463_to_fp16 = const()[name = tensor("op_463_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89642752)))]; + tensor var_464_to_fp16 = const()[name = tensor("op_464_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91739968)))]; + tensor v_13_cast = linear(bias = var_464_to_fp16, weight = var_463_to_fp16, x = var_444_cast); + tensor var_472 = const()[name = tensor("op_472"), val = tensor([1, 1500, 16, -1])]; + tensor var_473_cast = reshape(shape = var_472, x = q_13_cast); + tensor const_174_to_fp16 = const()[name = tensor("const_174_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_15_cast = mul(x = var_473_cast, y = const_174_to_fp16); + tensor var_479 = const()[name = tensor("op_479"), val = tensor([1, 1500, 16, -1])]; + tensor var_480_cast = reshape(shape = var_479, x = k_13_cast); + tensor const_175_to_fp16 = const()[name = tensor("const_175_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_15_cast = mul(x = var_480_cast, y = const_175_to_fp16); + tensor var_486 = const()[name = tensor("op_486"), val = tensor([1, 1500, 16, -1])]; + tensor var_487_cast = reshape(shape = var_486, x = v_13_cast); + tensor var_488 = const()[name = tensor("op_488"), val = tensor([0, 2, 1, 3])]; + tensor qk_7_transpose_x_0 = const()[name = tensor("qk_7_transpose_x_0"), val = tensor(false)]; + tensor qk_7_transpose_y_0 = const()[name = tensor("qk_7_transpose_y_0"), val = tensor(false)]; + tensor transpose_54_perm_0 = const()[name = tensor("transpose_54_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_55_perm_0 = const()[name = tensor("transpose_55_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_177 = transpose(perm = transpose_55_perm_0, x = k_15_cast); + tensor transpose_178 = transpose(perm = transpose_54_perm_0, x = q_15_cast); + tensor qk_7_cast = matmul(transpose_x = qk_7_transpose_x_0, transpose_y = qk_7_transpose_y_0, x = transpose_178, y = transpose_177); + tensor var_492_cast = softmax(axis = var_427, x = qk_7_cast); + tensor var_494_transpose_x_0 = const()[name = tensor("op_494_transpose_x_0"), val = tensor(false)]; + tensor var_494_transpose_y_0 = const()[name = tensor("op_494_transpose_y_0"), val = tensor(false)]; + tensor transpose_179 = transpose(perm = var_488, x = var_487_cast); + tensor var_494_cast = matmul(transpose_x = var_494_transpose_x_0, transpose_y = var_494_transpose_y_0, x = var_492_cast, y = transpose_179); + tensor var_495 = const()[name = tensor("op_495"), val = tensor([0, 2, 1, 3])]; + tensor concat_3 = const()[name = tensor("concat_3"), val = tensor([1, 1500, 1024])]; + tensor transpose_176 = transpose(perm = var_495, x = var_494_cast); + tensor x_47_cast = reshape(shape = concat_3, x = transpose_176); + tensor var_500_to_fp16 = const()[name = tensor("op_500_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91742080)))]; + tensor var_501_to_fp16 = const()[name = tensor("op_501_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93839296)))]; + tensor var_502_cast = linear(bias = var_501_to_fp16, weight = var_500_to_fp16, x = x_47_cast); + tensor x_49_cast = add(x = x_43_cast, y = var_502_cast); + tensor var_508_axes_0 = const()[name = tensor("op_508_axes_0"), val = tensor([-1])]; + tensor blocks_3_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93841408)))]; + tensor blocks_3_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93843520)))]; + tensor var_508_cast = layer_norm(axes = var_508_axes_0, beta = blocks_3_mlp_ln_bias_to_fp16, epsilon = var_433_to_fp16, gamma = blocks_3_mlp_ln_weight_to_fp16, x = x_49_cast); + tensor var_517_to_fp16 = const()[name = tensor("op_517_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93845632)))]; + tensor var_518_to_fp16 = const()[name = tensor("op_518_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102234304)))]; + tensor input_33_cast = linear(bias = var_518_to_fp16, weight = var_517_to_fp16, x = var_508_cast); + tensor x_53_mode_0 = const()[name = tensor("x_53_mode_0"), val = tensor("EXACT")]; + tensor x_53_cast = gelu(mode = x_53_mode_0, x = input_33_cast); + tensor var_523_to_fp16 = const()[name = tensor("op_523_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102242560)))]; + tensor var_524_to_fp16 = const()[name = tensor("op_524_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110631232)))]; + tensor var_525_cast = linear(bias = var_524_to_fp16, weight = var_523_to_fp16, x = x_53_cast); + tensor x_55_cast = add(x = x_49_cast, y = var_525_cast); + tensor var_534 = const()[name = tensor("op_534"), val = tensor(-1)]; + tensor var_551_axes_0 = const()[name = tensor("op_551_axes_0"), val = tensor([-1])]; + tensor blocks_4_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_4_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110633344)))]; + tensor blocks_4_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_4_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110635456)))]; + tensor var_540_to_fp16 = const()[name = tensor("op_540_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_551_cast = layer_norm(axes = var_551_axes_0, beta = blocks_4_attn_ln_bias_to_fp16, epsilon = var_540_to_fp16, gamma = blocks_4_attn_ln_weight_to_fp16, x = x_55_cast); + tensor var_562_to_fp16 = const()[name = tensor("op_562_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110637568)))]; + tensor var_563_to_fp16 = const()[name = tensor("op_563_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(112734784)))]; + tensor q_17_cast = linear(bias = var_563_to_fp16, weight = var_562_to_fp16, x = var_551_cast); + tensor var_566_to_fp16 = const()[name = tensor("op_566_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(112736896)))]; + tensor k_17_bias_0_to_fp16 = const()[name = tensor("k_17_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114834112)))]; + tensor k_17_cast = linear(bias = k_17_bias_0_to_fp16, weight = var_566_to_fp16, x = var_551_cast); + tensor var_570_to_fp16 = const()[name = tensor("op_570_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114836224)))]; + tensor var_571_to_fp16 = const()[name = tensor("op_571_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116933440)))]; + tensor v_17_cast = linear(bias = var_571_to_fp16, weight = var_570_to_fp16, x = var_551_cast); + tensor var_579 = const()[name = tensor("op_579"), val = tensor([1, 1500, 16, -1])]; + tensor var_580_cast = reshape(shape = var_579, x = q_17_cast); + tensor const_176_to_fp16 = const()[name = tensor("const_176_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_19_cast = mul(x = var_580_cast, y = const_176_to_fp16); + tensor var_586 = const()[name = tensor("op_586"), val = tensor([1, 1500, 16, -1])]; + tensor var_587_cast = reshape(shape = var_586, x = k_17_cast); + tensor const_177_to_fp16 = const()[name = tensor("const_177_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_19_cast = mul(x = var_587_cast, y = const_177_to_fp16); + tensor var_593 = const()[name = tensor("op_593"), val = tensor([1, 1500, 16, -1])]; + tensor var_594_cast = reshape(shape = var_593, x = v_17_cast); + tensor var_595 = const()[name = tensor("op_595"), val = tensor([0, 2, 1, 3])]; + tensor qk_9_transpose_x_0 = const()[name = tensor("qk_9_transpose_x_0"), val = tensor(false)]; + tensor qk_9_transpose_y_0 = const()[name = tensor("qk_9_transpose_y_0"), val = tensor(false)]; + tensor transpose_56_perm_0 = const()[name = tensor("transpose_56_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_57_perm_0 = const()[name = tensor("transpose_57_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_173 = transpose(perm = transpose_57_perm_0, x = k_19_cast); + tensor transpose_174 = transpose(perm = transpose_56_perm_0, x = q_19_cast); + tensor qk_9_cast = matmul(transpose_x = qk_9_transpose_x_0, transpose_y = qk_9_transpose_y_0, x = transpose_174, y = transpose_173); + tensor var_599_cast = softmax(axis = var_534, x = qk_9_cast); + tensor var_601_transpose_x_0 = const()[name = tensor("op_601_transpose_x_0"), val = tensor(false)]; + tensor var_601_transpose_y_0 = const()[name = tensor("op_601_transpose_y_0"), val = tensor(false)]; + tensor transpose_175 = transpose(perm = var_595, x = var_594_cast); + tensor var_601_cast = matmul(transpose_x = var_601_transpose_x_0, transpose_y = var_601_transpose_y_0, x = var_599_cast, y = transpose_175); + tensor var_602 = const()[name = tensor("op_602"), val = tensor([0, 2, 1, 3])]; + tensor concat_4 = const()[name = tensor("concat_4"), val = tensor([1, 1500, 1024])]; + tensor transpose_172 = transpose(perm = var_602, x = var_601_cast); + tensor x_59_cast = reshape(shape = concat_4, x = transpose_172); + tensor var_607_to_fp16 = const()[name = tensor("op_607_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116935552)))]; + tensor var_608_to_fp16 = const()[name = tensor("op_608_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119032768)))]; + tensor var_609_cast = linear(bias = var_608_to_fp16, weight = var_607_to_fp16, x = x_59_cast); + tensor x_61_cast = add(x = x_55_cast, y = var_609_cast); + tensor var_615_axes_0 = const()[name = tensor("op_615_axes_0"), val = tensor([-1])]; + tensor blocks_4_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119034880)))]; + tensor blocks_4_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119036992)))]; + tensor var_615_cast = layer_norm(axes = var_615_axes_0, beta = blocks_4_mlp_ln_bias_to_fp16, epsilon = var_540_to_fp16, gamma = blocks_4_mlp_ln_weight_to_fp16, x = x_61_cast); + tensor var_624_to_fp16 = const()[name = tensor("op_624_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119039104)))]; + tensor var_625_to_fp16 = const()[name = tensor("op_625_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127427776)))]; + tensor input_41_cast = linear(bias = var_625_to_fp16, weight = var_624_to_fp16, x = var_615_cast); + tensor x_65_mode_0 = const()[name = tensor("x_65_mode_0"), val = tensor("EXACT")]; + tensor x_65_cast = gelu(mode = x_65_mode_0, x = input_41_cast); + tensor var_630_to_fp16 = const()[name = tensor("op_630_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127436032)))]; + tensor var_631_to_fp16 = const()[name = tensor("op_631_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135824704)))]; + tensor var_632_cast = linear(bias = var_631_to_fp16, weight = var_630_to_fp16, x = x_65_cast); + tensor x_67_cast = add(x = x_61_cast, y = var_632_cast); + tensor var_641 = const()[name = tensor("op_641"), val = tensor(-1)]; + tensor var_658_axes_0 = const()[name = tensor("op_658_axes_0"), val = tensor([-1])]; + tensor blocks_5_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_5_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135826816)))]; + tensor blocks_5_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_5_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135828928)))]; + tensor var_647_to_fp16 = const()[name = tensor("op_647_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_658_cast = layer_norm(axes = var_658_axes_0, beta = blocks_5_attn_ln_bias_to_fp16, epsilon = var_647_to_fp16, gamma = blocks_5_attn_ln_weight_to_fp16, x = x_67_cast); + tensor var_669_to_fp16 = const()[name = tensor("op_669_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135831040)))]; + tensor var_670_to_fp16 = const()[name = tensor("op_670_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(137928256)))]; + tensor q_21_cast = linear(bias = var_670_to_fp16, weight = var_669_to_fp16, x = var_658_cast); + tensor var_673_to_fp16 = const()[name = tensor("op_673_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(137930368)))]; + tensor k_21_bias_0_to_fp16 = const()[name = tensor("k_21_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140027584)))]; + tensor k_21_cast = linear(bias = k_21_bias_0_to_fp16, weight = var_673_to_fp16, x = var_658_cast); + tensor var_677_to_fp16 = const()[name = tensor("op_677_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140029696)))]; + tensor var_678_to_fp16 = const()[name = tensor("op_678_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142126912)))]; + tensor v_21_cast = linear(bias = var_678_to_fp16, weight = var_677_to_fp16, x = var_658_cast); + tensor var_686 = const()[name = tensor("op_686"), val = tensor([1, 1500, 16, -1])]; + tensor var_687_cast = reshape(shape = var_686, x = q_21_cast); + tensor const_178_to_fp16 = const()[name = tensor("const_178_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_23_cast = mul(x = var_687_cast, y = const_178_to_fp16); + tensor var_693 = const()[name = tensor("op_693"), val = tensor([1, 1500, 16, -1])]; + tensor var_694_cast = reshape(shape = var_693, x = k_21_cast); + tensor const_179_to_fp16 = const()[name = tensor("const_179_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_23_cast = mul(x = var_694_cast, y = const_179_to_fp16); + tensor var_700 = const()[name = tensor("op_700"), val = tensor([1, 1500, 16, -1])]; + tensor var_701_cast = reshape(shape = var_700, x = v_21_cast); + tensor var_702 = const()[name = tensor("op_702"), val = tensor([0, 2, 1, 3])]; + tensor qk_11_transpose_x_0 = const()[name = tensor("qk_11_transpose_x_0"), val = tensor(false)]; + tensor qk_11_transpose_y_0 = const()[name = tensor("qk_11_transpose_y_0"), val = tensor(false)]; + tensor transpose_58_perm_0 = const()[name = tensor("transpose_58_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_59_perm_0 = const()[name = tensor("transpose_59_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_169 = transpose(perm = transpose_59_perm_0, x = k_23_cast); + tensor transpose_170 = transpose(perm = transpose_58_perm_0, x = q_23_cast); + tensor qk_11_cast = matmul(transpose_x = qk_11_transpose_x_0, transpose_y = qk_11_transpose_y_0, x = transpose_170, y = transpose_169); + tensor var_706_cast = softmax(axis = var_641, x = qk_11_cast); + tensor var_708_transpose_x_0 = const()[name = tensor("op_708_transpose_x_0"), val = tensor(false)]; + tensor var_708_transpose_y_0 = const()[name = tensor("op_708_transpose_y_0"), val = tensor(false)]; + tensor transpose_171 = transpose(perm = var_702, x = var_701_cast); + tensor var_708_cast = matmul(transpose_x = var_708_transpose_x_0, transpose_y = var_708_transpose_y_0, x = var_706_cast, y = transpose_171); + tensor var_709 = const()[name = tensor("op_709"), val = tensor([0, 2, 1, 3])]; + tensor concat_5 = const()[name = tensor("concat_5"), val = tensor([1, 1500, 1024])]; + tensor transpose_168 = transpose(perm = var_709, x = var_708_cast); + tensor x_71_cast = reshape(shape = concat_5, x = transpose_168); + tensor var_714_to_fp16 = const()[name = tensor("op_714_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142129024)))]; + tensor var_715_to_fp16 = const()[name = tensor("op_715_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144226240)))]; + tensor var_716_cast = linear(bias = var_715_to_fp16, weight = var_714_to_fp16, x = x_71_cast); + tensor x_73_cast = add(x = x_67_cast, y = var_716_cast); + tensor var_722_axes_0 = const()[name = tensor("op_722_axes_0"), val = tensor([-1])]; + tensor blocks_5_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144228352)))]; + tensor blocks_5_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144230464)))]; + tensor var_722_cast = layer_norm(axes = var_722_axes_0, beta = blocks_5_mlp_ln_bias_to_fp16, epsilon = var_647_to_fp16, gamma = blocks_5_mlp_ln_weight_to_fp16, x = x_73_cast); + tensor var_731_to_fp16 = const()[name = tensor("op_731_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144232576)))]; + tensor var_732_to_fp16 = const()[name = tensor("op_732_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(152621248)))]; + tensor input_49_cast = linear(bias = var_732_to_fp16, weight = var_731_to_fp16, x = var_722_cast); + tensor x_77_mode_0 = const()[name = tensor("x_77_mode_0"), val = tensor("EXACT")]; + tensor x_77_cast = gelu(mode = x_77_mode_0, x = input_49_cast); + tensor var_737_to_fp16 = const()[name = tensor("op_737_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(152629504)))]; + tensor var_738_to_fp16 = const()[name = tensor("op_738_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(161018176)))]; + tensor var_739_cast = linear(bias = var_738_to_fp16, weight = var_737_to_fp16, x = x_77_cast); + tensor x_79_cast = add(x = x_73_cast, y = var_739_cast); + tensor var_748 = const()[name = tensor("op_748"), val = tensor(-1)]; + tensor var_765_axes_0 = const()[name = tensor("op_765_axes_0"), val = tensor([-1])]; + tensor blocks_6_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_6_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(161020288)))]; + tensor blocks_6_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_6_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(161022400)))]; + tensor var_754_to_fp16 = const()[name = tensor("op_754_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_765_cast = layer_norm(axes = var_765_axes_0, beta = blocks_6_attn_ln_bias_to_fp16, epsilon = var_754_to_fp16, gamma = blocks_6_attn_ln_weight_to_fp16, x = x_79_cast); + tensor var_776_to_fp16 = const()[name = tensor("op_776_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(161024512)))]; + tensor var_777_to_fp16 = const()[name = tensor("op_777_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163121728)))]; + tensor q_25_cast = linear(bias = var_777_to_fp16, weight = var_776_to_fp16, x = var_765_cast); + tensor var_780_to_fp16 = const()[name = tensor("op_780_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163123840)))]; + tensor k_25_bias_0_to_fp16 = const()[name = tensor("k_25_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165221056)))]; + tensor k_25_cast = linear(bias = k_25_bias_0_to_fp16, weight = var_780_to_fp16, x = var_765_cast); + tensor var_784_to_fp16 = const()[name = tensor("op_784_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165223168)))]; + tensor var_785_to_fp16 = const()[name = tensor("op_785_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167320384)))]; + tensor v_25_cast = linear(bias = var_785_to_fp16, weight = var_784_to_fp16, x = var_765_cast); + tensor var_793 = const()[name = tensor("op_793"), val = tensor([1, 1500, 16, -1])]; + tensor var_794_cast = reshape(shape = var_793, x = q_25_cast); + tensor const_180_to_fp16 = const()[name = tensor("const_180_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_27_cast = mul(x = var_794_cast, y = const_180_to_fp16); + tensor var_800 = const()[name = tensor("op_800"), val = tensor([1, 1500, 16, -1])]; + tensor var_801_cast = reshape(shape = var_800, x = k_25_cast); + tensor const_181_to_fp16 = const()[name = tensor("const_181_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_27_cast = mul(x = var_801_cast, y = const_181_to_fp16); + tensor var_807 = const()[name = tensor("op_807"), val = tensor([1, 1500, 16, -1])]; + tensor var_808_cast = reshape(shape = var_807, x = v_25_cast); + tensor var_809 = const()[name = tensor("op_809"), val = tensor([0, 2, 1, 3])]; + tensor qk_13_transpose_x_0 = const()[name = tensor("qk_13_transpose_x_0"), val = tensor(false)]; + tensor qk_13_transpose_y_0 = const()[name = tensor("qk_13_transpose_y_0"), val = tensor(false)]; + tensor transpose_60_perm_0 = const()[name = tensor("transpose_60_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_61_perm_0 = const()[name = tensor("transpose_61_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_165 = transpose(perm = transpose_61_perm_0, x = k_27_cast); + tensor transpose_166 = transpose(perm = transpose_60_perm_0, x = q_27_cast); + tensor qk_13_cast = matmul(transpose_x = qk_13_transpose_x_0, transpose_y = qk_13_transpose_y_0, x = transpose_166, y = transpose_165); + tensor var_813_cast = softmax(axis = var_748, x = qk_13_cast); + tensor var_815_transpose_x_0 = const()[name = tensor("op_815_transpose_x_0"), val = tensor(false)]; + tensor var_815_transpose_y_0 = const()[name = tensor("op_815_transpose_y_0"), val = tensor(false)]; + tensor transpose_167 = transpose(perm = var_809, x = var_808_cast); + tensor var_815_cast = matmul(transpose_x = var_815_transpose_x_0, transpose_y = var_815_transpose_y_0, x = var_813_cast, y = transpose_167); + tensor var_816 = const()[name = tensor("op_816"), val = tensor([0, 2, 1, 3])]; + tensor concat_6 = const()[name = tensor("concat_6"), val = tensor([1, 1500, 1024])]; + tensor transpose_164 = transpose(perm = var_816, x = var_815_cast); + tensor x_83_cast = reshape(shape = concat_6, x = transpose_164); + tensor var_821_to_fp16 = const()[name = tensor("op_821_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167322496)))]; + tensor var_822_to_fp16 = const()[name = tensor("op_822_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169419712)))]; + tensor var_823_cast = linear(bias = var_822_to_fp16, weight = var_821_to_fp16, x = x_83_cast); + tensor x_85_cast = add(x = x_79_cast, y = var_823_cast); + tensor var_829_axes_0 = const()[name = tensor("op_829_axes_0"), val = tensor([-1])]; + tensor blocks_6_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_6_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169421824)))]; + tensor blocks_6_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_6_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169423936)))]; + tensor var_829_cast = layer_norm(axes = var_829_axes_0, beta = blocks_6_mlp_ln_bias_to_fp16, epsilon = var_754_to_fp16, gamma = blocks_6_mlp_ln_weight_to_fp16, x = x_85_cast); + tensor var_838_to_fp16 = const()[name = tensor("op_838_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169426048)))]; + tensor var_839_to_fp16 = const()[name = tensor("op_839_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177814720)))]; + tensor input_57_cast = linear(bias = var_839_to_fp16, weight = var_838_to_fp16, x = var_829_cast); + tensor x_89_mode_0 = const()[name = tensor("x_89_mode_0"), val = tensor("EXACT")]; + tensor x_89_cast = gelu(mode = x_89_mode_0, x = input_57_cast); + tensor var_844_to_fp16 = const()[name = tensor("op_844_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177822976)))]; + tensor var_845_to_fp16 = const()[name = tensor("op_845_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186211648)))]; + tensor var_846_cast = linear(bias = var_845_to_fp16, weight = var_844_to_fp16, x = x_89_cast); + tensor x_91_cast = add(x = x_85_cast, y = var_846_cast); + tensor var_855 = const()[name = tensor("op_855"), val = tensor(-1)]; + tensor var_872_axes_0 = const()[name = tensor("op_872_axes_0"), val = tensor([-1])]; + tensor blocks_7_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_7_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186213760)))]; + tensor blocks_7_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_7_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186215872)))]; + tensor var_861_to_fp16 = const()[name = tensor("op_861_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_872_cast = layer_norm(axes = var_872_axes_0, beta = blocks_7_attn_ln_bias_to_fp16, epsilon = var_861_to_fp16, gamma = blocks_7_attn_ln_weight_to_fp16, x = x_91_cast); + tensor var_883_to_fp16 = const()[name = tensor("op_883_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186217984)))]; + tensor var_884_to_fp16 = const()[name = tensor("op_884_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(188315200)))]; + tensor q_29_cast = linear(bias = var_884_to_fp16, weight = var_883_to_fp16, x = var_872_cast); + tensor var_887_to_fp16 = const()[name = tensor("op_887_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(188317312)))]; + tensor k_29_bias_0_to_fp16 = const()[name = tensor("k_29_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190414528)))]; + tensor k_29_cast = linear(bias = k_29_bias_0_to_fp16, weight = var_887_to_fp16, x = var_872_cast); + tensor var_891_to_fp16 = const()[name = tensor("op_891_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190416640)))]; + tensor var_892_to_fp16 = const()[name = tensor("op_892_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192513856)))]; + tensor v_29_cast = linear(bias = var_892_to_fp16, weight = var_891_to_fp16, x = var_872_cast); + tensor var_900 = const()[name = tensor("op_900"), val = tensor([1, 1500, 16, -1])]; + tensor var_901_cast = reshape(shape = var_900, x = q_29_cast); + tensor const_182_to_fp16 = const()[name = tensor("const_182_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_31_cast = mul(x = var_901_cast, y = const_182_to_fp16); + tensor var_907 = const()[name = tensor("op_907"), val = tensor([1, 1500, 16, -1])]; + tensor var_908_cast = reshape(shape = var_907, x = k_29_cast); + tensor const_183_to_fp16 = const()[name = tensor("const_183_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_31_cast = mul(x = var_908_cast, y = const_183_to_fp16); + tensor var_914 = const()[name = tensor("op_914"), val = tensor([1, 1500, 16, -1])]; + tensor var_915_cast = reshape(shape = var_914, x = v_29_cast); + tensor var_916 = const()[name = tensor("op_916"), val = tensor([0, 2, 1, 3])]; + tensor qk_15_transpose_x_0 = const()[name = tensor("qk_15_transpose_x_0"), val = tensor(false)]; + tensor qk_15_transpose_y_0 = const()[name = tensor("qk_15_transpose_y_0"), val = tensor(false)]; + tensor transpose_62_perm_0 = const()[name = tensor("transpose_62_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_63_perm_0 = const()[name = tensor("transpose_63_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_161 = transpose(perm = transpose_63_perm_0, x = k_31_cast); + tensor transpose_162 = transpose(perm = transpose_62_perm_0, x = q_31_cast); + tensor qk_15_cast = matmul(transpose_x = qk_15_transpose_x_0, transpose_y = qk_15_transpose_y_0, x = transpose_162, y = transpose_161); + tensor var_920_cast = softmax(axis = var_855, x = qk_15_cast); + tensor var_922_transpose_x_0 = const()[name = tensor("op_922_transpose_x_0"), val = tensor(false)]; + tensor var_922_transpose_y_0 = const()[name = tensor("op_922_transpose_y_0"), val = tensor(false)]; + tensor transpose_163 = transpose(perm = var_916, x = var_915_cast); + tensor var_922_cast = matmul(transpose_x = var_922_transpose_x_0, transpose_y = var_922_transpose_y_0, x = var_920_cast, y = transpose_163); + tensor var_923 = const()[name = tensor("op_923"), val = tensor([0, 2, 1, 3])]; + tensor concat_7 = const()[name = tensor("concat_7"), val = tensor([1, 1500, 1024])]; + tensor transpose_160 = transpose(perm = var_923, x = var_922_cast); + tensor x_95_cast = reshape(shape = concat_7, x = transpose_160); + tensor var_928_to_fp16 = const()[name = tensor("op_928_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192515968)))]; + tensor var_929_to_fp16 = const()[name = tensor("op_929_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194613184)))]; + tensor var_930_cast = linear(bias = var_929_to_fp16, weight = var_928_to_fp16, x = x_95_cast); + tensor x_97_cast = add(x = x_91_cast, y = var_930_cast); + tensor var_936_axes_0 = const()[name = tensor("op_936_axes_0"), val = tensor([-1])]; + tensor blocks_7_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_7_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194615296)))]; + tensor blocks_7_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_7_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194617408)))]; + tensor var_936_cast = layer_norm(axes = var_936_axes_0, beta = blocks_7_mlp_ln_bias_to_fp16, epsilon = var_861_to_fp16, gamma = blocks_7_mlp_ln_weight_to_fp16, x = x_97_cast); + tensor var_945_to_fp16 = const()[name = tensor("op_945_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194619520)))]; + tensor var_946_to_fp16 = const()[name = tensor("op_946_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(203008192)))]; + tensor input_65_cast = linear(bias = var_946_to_fp16, weight = var_945_to_fp16, x = var_936_cast); + tensor x_101_mode_0 = const()[name = tensor("x_101_mode_0"), val = tensor("EXACT")]; + tensor x_101_cast = gelu(mode = x_101_mode_0, x = input_65_cast); + tensor var_951_to_fp16 = const()[name = tensor("op_951_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(203016448)))]; + tensor var_952_to_fp16 = const()[name = tensor("op_952_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211405120)))]; + tensor var_953_cast = linear(bias = var_952_to_fp16, weight = var_951_to_fp16, x = x_101_cast); + tensor x_103_cast = add(x = x_97_cast, y = var_953_cast); + tensor var_962 = const()[name = tensor("op_962"), val = tensor(-1)]; + tensor var_979_axes_0 = const()[name = tensor("op_979_axes_0"), val = tensor([-1])]; + tensor blocks_8_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_8_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211407232)))]; + tensor blocks_8_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_8_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211409344)))]; + tensor var_968_to_fp16 = const()[name = tensor("op_968_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_979_cast = layer_norm(axes = var_979_axes_0, beta = blocks_8_attn_ln_bias_to_fp16, epsilon = var_968_to_fp16, gamma = blocks_8_attn_ln_weight_to_fp16, x = x_103_cast); + tensor var_990_to_fp16 = const()[name = tensor("op_990_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211411456)))]; + tensor var_991_to_fp16 = const()[name = tensor("op_991_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(213508672)))]; + tensor q_33_cast = linear(bias = var_991_to_fp16, weight = var_990_to_fp16, x = var_979_cast); + tensor var_994_to_fp16 = const()[name = tensor("op_994_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(213510784)))]; + tensor k_33_bias_0_to_fp16 = const()[name = tensor("k_33_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215608000)))]; + tensor k_33_cast = linear(bias = k_33_bias_0_to_fp16, weight = var_994_to_fp16, x = var_979_cast); + tensor var_998_to_fp16 = const()[name = tensor("op_998_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215610112)))]; + tensor var_999_to_fp16 = const()[name = tensor("op_999_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217707328)))]; + tensor v_33_cast = linear(bias = var_999_to_fp16, weight = var_998_to_fp16, x = var_979_cast); + tensor var_1007 = const()[name = tensor("op_1007"), val = tensor([1, 1500, 16, -1])]; + tensor var_1008_cast = reshape(shape = var_1007, x = q_33_cast); + tensor const_184_to_fp16 = const()[name = tensor("const_184_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_35_cast = mul(x = var_1008_cast, y = const_184_to_fp16); + tensor var_1014 = const()[name = tensor("op_1014"), val = tensor([1, 1500, 16, -1])]; + tensor var_1015_cast = reshape(shape = var_1014, x = k_33_cast); + tensor const_185_to_fp16 = const()[name = tensor("const_185_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_35_cast = mul(x = var_1015_cast, y = const_185_to_fp16); + tensor var_1021 = const()[name = tensor("op_1021"), val = tensor([1, 1500, 16, -1])]; + tensor var_1022_cast = reshape(shape = var_1021, x = v_33_cast); + tensor var_1023 = const()[name = tensor("op_1023"), val = tensor([0, 2, 1, 3])]; + tensor qk_17_transpose_x_0 = const()[name = tensor("qk_17_transpose_x_0"), val = tensor(false)]; + tensor qk_17_transpose_y_0 = const()[name = tensor("qk_17_transpose_y_0"), val = tensor(false)]; + tensor transpose_64_perm_0 = const()[name = tensor("transpose_64_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_65_perm_0 = const()[name = tensor("transpose_65_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_157 = transpose(perm = transpose_65_perm_0, x = k_35_cast); + tensor transpose_158 = transpose(perm = transpose_64_perm_0, x = q_35_cast); + tensor qk_17_cast = matmul(transpose_x = qk_17_transpose_x_0, transpose_y = qk_17_transpose_y_0, x = transpose_158, y = transpose_157); + tensor var_1027_cast = softmax(axis = var_962, x = qk_17_cast); + tensor var_1029_transpose_x_0 = const()[name = tensor("op_1029_transpose_x_0"), val = tensor(false)]; + tensor var_1029_transpose_y_0 = const()[name = tensor("op_1029_transpose_y_0"), val = tensor(false)]; + tensor transpose_159 = transpose(perm = var_1023, x = var_1022_cast); + tensor var_1029_cast = matmul(transpose_x = var_1029_transpose_x_0, transpose_y = var_1029_transpose_y_0, x = var_1027_cast, y = transpose_159); + tensor var_1030 = const()[name = tensor("op_1030"), val = tensor([0, 2, 1, 3])]; + tensor concat_8 = const()[name = tensor("concat_8"), val = tensor([1, 1500, 1024])]; + tensor transpose_156 = transpose(perm = var_1030, x = var_1029_cast); + tensor x_107_cast = reshape(shape = concat_8, x = transpose_156); + tensor var_1035_to_fp16 = const()[name = tensor("op_1035_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217709440)))]; + tensor var_1036_to_fp16 = const()[name = tensor("op_1036_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219806656)))]; + tensor var_1037_cast = linear(bias = var_1036_to_fp16, weight = var_1035_to_fp16, x = x_107_cast); + tensor x_109_cast = add(x = x_103_cast, y = var_1037_cast); + tensor var_1043_axes_0 = const()[name = tensor("op_1043_axes_0"), val = tensor([-1])]; + tensor blocks_8_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_8_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219808768)))]; + tensor blocks_8_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_8_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219810880)))]; + tensor var_1043_cast = layer_norm(axes = var_1043_axes_0, beta = blocks_8_mlp_ln_bias_to_fp16, epsilon = var_968_to_fp16, gamma = blocks_8_mlp_ln_weight_to_fp16, x = x_109_cast); + tensor var_1052_to_fp16 = const()[name = tensor("op_1052_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219812992)))]; + tensor var_1053_to_fp16 = const()[name = tensor("op_1053_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(228201664)))]; + tensor input_73_cast = linear(bias = var_1053_to_fp16, weight = var_1052_to_fp16, x = var_1043_cast); + tensor x_113_mode_0 = const()[name = tensor("x_113_mode_0"), val = tensor("EXACT")]; + tensor x_113_cast = gelu(mode = x_113_mode_0, x = input_73_cast); + tensor var_1058_to_fp16 = const()[name = tensor("op_1058_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(228209920)))]; + tensor var_1059_to_fp16 = const()[name = tensor("op_1059_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236598592)))]; + tensor var_1060_cast = linear(bias = var_1059_to_fp16, weight = var_1058_to_fp16, x = x_113_cast); + tensor x_115_cast = add(x = x_109_cast, y = var_1060_cast); + tensor var_1069 = const()[name = tensor("op_1069"), val = tensor(-1)]; + tensor var_1086_axes_0 = const()[name = tensor("op_1086_axes_0"), val = tensor([-1])]; + tensor blocks_9_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_9_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236600704)))]; + tensor blocks_9_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_9_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236602816)))]; + tensor var_1075_to_fp16 = const()[name = tensor("op_1075_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1086_cast = layer_norm(axes = var_1086_axes_0, beta = blocks_9_attn_ln_bias_to_fp16, epsilon = var_1075_to_fp16, gamma = blocks_9_attn_ln_weight_to_fp16, x = x_115_cast); + tensor var_1097_to_fp16 = const()[name = tensor("op_1097_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236604928)))]; + tensor var_1098_to_fp16 = const()[name = tensor("op_1098_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(238702144)))]; + tensor q_37_cast = linear(bias = var_1098_to_fp16, weight = var_1097_to_fp16, x = var_1086_cast); + tensor var_1101_to_fp16 = const()[name = tensor("op_1101_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(238704256)))]; + tensor k_37_bias_0_to_fp16 = const()[name = tensor("k_37_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240801472)))]; + tensor k_37_cast = linear(bias = k_37_bias_0_to_fp16, weight = var_1101_to_fp16, x = var_1086_cast); + tensor var_1105_to_fp16 = const()[name = tensor("op_1105_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240803584)))]; + tensor var_1106_to_fp16 = const()[name = tensor("op_1106_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(242900800)))]; + tensor v_37_cast = linear(bias = var_1106_to_fp16, weight = var_1105_to_fp16, x = var_1086_cast); + tensor var_1114 = const()[name = tensor("op_1114"), val = tensor([1, 1500, 16, -1])]; + tensor var_1115_cast = reshape(shape = var_1114, x = q_37_cast); + tensor const_186_to_fp16 = const()[name = tensor("const_186_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_39_cast = mul(x = var_1115_cast, y = const_186_to_fp16); + tensor var_1121 = const()[name = tensor("op_1121"), val = tensor([1, 1500, 16, -1])]; + tensor var_1122_cast = reshape(shape = var_1121, x = k_37_cast); + tensor const_187_to_fp16 = const()[name = tensor("const_187_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_39_cast = mul(x = var_1122_cast, y = const_187_to_fp16); + tensor var_1128 = const()[name = tensor("op_1128"), val = tensor([1, 1500, 16, -1])]; + tensor var_1129_cast = reshape(shape = var_1128, x = v_37_cast); + tensor var_1130 = const()[name = tensor("op_1130"), val = tensor([0, 2, 1, 3])]; + tensor qk_19_transpose_x_0 = const()[name = tensor("qk_19_transpose_x_0"), val = tensor(false)]; + tensor qk_19_transpose_y_0 = const()[name = tensor("qk_19_transpose_y_0"), val = tensor(false)]; + tensor transpose_66_perm_0 = const()[name = tensor("transpose_66_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_67_perm_0 = const()[name = tensor("transpose_67_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_153 = transpose(perm = transpose_67_perm_0, x = k_39_cast); + tensor transpose_154 = transpose(perm = transpose_66_perm_0, x = q_39_cast); + tensor qk_19_cast = matmul(transpose_x = qk_19_transpose_x_0, transpose_y = qk_19_transpose_y_0, x = transpose_154, y = transpose_153); + tensor var_1134_cast = softmax(axis = var_1069, x = qk_19_cast); + tensor var_1136_transpose_x_0 = const()[name = tensor("op_1136_transpose_x_0"), val = tensor(false)]; + tensor var_1136_transpose_y_0 = const()[name = tensor("op_1136_transpose_y_0"), val = tensor(false)]; + tensor transpose_155 = transpose(perm = var_1130, x = var_1129_cast); + tensor var_1136_cast = matmul(transpose_x = var_1136_transpose_x_0, transpose_y = var_1136_transpose_y_0, x = var_1134_cast, y = transpose_155); + tensor var_1137 = const()[name = tensor("op_1137"), val = tensor([0, 2, 1, 3])]; + tensor concat_9 = const()[name = tensor("concat_9"), val = tensor([1, 1500, 1024])]; + tensor transpose_152 = transpose(perm = var_1137, x = var_1136_cast); + tensor x_119_cast = reshape(shape = concat_9, x = transpose_152); + tensor var_1142_to_fp16 = const()[name = tensor("op_1142_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(242902912)))]; + tensor var_1143_to_fp16 = const()[name = tensor("op_1143_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245000128)))]; + tensor var_1144_cast = linear(bias = var_1143_to_fp16, weight = var_1142_to_fp16, x = x_119_cast); + tensor x_121_cast = add(x = x_115_cast, y = var_1144_cast); + tensor var_1150_axes_0 = const()[name = tensor("op_1150_axes_0"), val = tensor([-1])]; + tensor blocks_9_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_9_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245002240)))]; + tensor blocks_9_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_9_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245004352)))]; + tensor var_1150_cast = layer_norm(axes = var_1150_axes_0, beta = blocks_9_mlp_ln_bias_to_fp16, epsilon = var_1075_to_fp16, gamma = blocks_9_mlp_ln_weight_to_fp16, x = x_121_cast); + tensor var_1159_to_fp16 = const()[name = tensor("op_1159_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245006464)))]; + tensor var_1160_to_fp16 = const()[name = tensor("op_1160_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253395136)))]; + tensor input_81_cast = linear(bias = var_1160_to_fp16, weight = var_1159_to_fp16, x = var_1150_cast); + tensor x_125_mode_0 = const()[name = tensor("x_125_mode_0"), val = tensor("EXACT")]; + tensor x_125_cast = gelu(mode = x_125_mode_0, x = input_81_cast); + tensor var_1165_to_fp16 = const()[name = tensor("op_1165_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253403392)))]; + tensor var_1166_to_fp16 = const()[name = tensor("op_1166_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261792064)))]; + tensor var_1167_cast = linear(bias = var_1166_to_fp16, weight = var_1165_to_fp16, x = x_125_cast); + tensor x_127_cast = add(x = x_121_cast, y = var_1167_cast); + tensor var_1176 = const()[name = tensor("op_1176"), val = tensor(-1)]; + tensor var_1193_axes_0 = const()[name = tensor("op_1193_axes_0"), val = tensor([-1])]; + tensor blocks_10_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_10_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261794176)))]; + tensor blocks_10_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_10_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261796288)))]; + tensor var_1182_to_fp16 = const()[name = tensor("op_1182_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1193_cast = layer_norm(axes = var_1193_axes_0, beta = blocks_10_attn_ln_bias_to_fp16, epsilon = var_1182_to_fp16, gamma = blocks_10_attn_ln_weight_to_fp16, x = x_127_cast); + tensor var_1204_to_fp16 = const()[name = tensor("op_1204_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261798400)))]; + tensor var_1205_to_fp16 = const()[name = tensor("op_1205_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263895616)))]; + tensor q_41_cast = linear(bias = var_1205_to_fp16, weight = var_1204_to_fp16, x = var_1193_cast); + tensor var_1208_to_fp16 = const()[name = tensor("op_1208_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263897728)))]; + tensor k_41_bias_0_to_fp16 = const()[name = tensor("k_41_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265994944)))]; + tensor k_41_cast = linear(bias = k_41_bias_0_to_fp16, weight = var_1208_to_fp16, x = var_1193_cast); + tensor var_1212_to_fp16 = const()[name = tensor("op_1212_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265997056)))]; + tensor var_1213_to_fp16 = const()[name = tensor("op_1213_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268094272)))]; + tensor v_41_cast = linear(bias = var_1213_to_fp16, weight = var_1212_to_fp16, x = var_1193_cast); + tensor var_1221 = const()[name = tensor("op_1221"), val = tensor([1, 1500, 16, -1])]; + tensor var_1222_cast = reshape(shape = var_1221, x = q_41_cast); + tensor const_188_to_fp16 = const()[name = tensor("const_188_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_43_cast = mul(x = var_1222_cast, y = const_188_to_fp16); + tensor var_1228 = const()[name = tensor("op_1228"), val = tensor([1, 1500, 16, -1])]; + tensor var_1229_cast = reshape(shape = var_1228, x = k_41_cast); + tensor const_189_to_fp16 = const()[name = tensor("const_189_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_43_cast = mul(x = var_1229_cast, y = const_189_to_fp16); + tensor var_1235 = const()[name = tensor("op_1235"), val = tensor([1, 1500, 16, -1])]; + tensor var_1236_cast = reshape(shape = var_1235, x = v_41_cast); + tensor var_1237 = const()[name = tensor("op_1237"), val = tensor([0, 2, 1, 3])]; + tensor qk_21_transpose_x_0 = const()[name = tensor("qk_21_transpose_x_0"), val = tensor(false)]; + tensor qk_21_transpose_y_0 = const()[name = tensor("qk_21_transpose_y_0"), val = tensor(false)]; + tensor transpose_68_perm_0 = const()[name = tensor("transpose_68_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_69_perm_0 = const()[name = tensor("transpose_69_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_149 = transpose(perm = transpose_69_perm_0, x = k_43_cast); + tensor transpose_150 = transpose(perm = transpose_68_perm_0, x = q_43_cast); + tensor qk_21_cast = matmul(transpose_x = qk_21_transpose_x_0, transpose_y = qk_21_transpose_y_0, x = transpose_150, y = transpose_149); + tensor var_1241_cast = softmax(axis = var_1176, x = qk_21_cast); + tensor var_1243_transpose_x_0 = const()[name = tensor("op_1243_transpose_x_0"), val = tensor(false)]; + tensor var_1243_transpose_y_0 = const()[name = tensor("op_1243_transpose_y_0"), val = tensor(false)]; + tensor transpose_151 = transpose(perm = var_1237, x = var_1236_cast); + tensor var_1243_cast = matmul(transpose_x = var_1243_transpose_x_0, transpose_y = var_1243_transpose_y_0, x = var_1241_cast, y = transpose_151); + tensor var_1244 = const()[name = tensor("op_1244"), val = tensor([0, 2, 1, 3])]; + tensor concat_10 = const()[name = tensor("concat_10"), val = tensor([1, 1500, 1024])]; + tensor transpose_148 = transpose(perm = var_1244, x = var_1243_cast); + tensor x_131_cast = reshape(shape = concat_10, x = transpose_148); + tensor var_1249_to_fp16 = const()[name = tensor("op_1249_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268096384)))]; + tensor var_1250_to_fp16 = const()[name = tensor("op_1250_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270193600)))]; + tensor var_1251_cast = linear(bias = var_1250_to_fp16, weight = var_1249_to_fp16, x = x_131_cast); + tensor x_133_cast = add(x = x_127_cast, y = var_1251_cast); + tensor var_1257_axes_0 = const()[name = tensor("op_1257_axes_0"), val = tensor([-1])]; + tensor blocks_10_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_10_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270195712)))]; + tensor blocks_10_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_10_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270197824)))]; + tensor var_1257_cast = layer_norm(axes = var_1257_axes_0, beta = blocks_10_mlp_ln_bias_to_fp16, epsilon = var_1182_to_fp16, gamma = blocks_10_mlp_ln_weight_to_fp16, x = x_133_cast); + tensor var_1266_to_fp16 = const()[name = tensor("op_1266_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270199936)))]; + tensor var_1267_to_fp16 = const()[name = tensor("op_1267_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278588608)))]; + tensor input_89_cast = linear(bias = var_1267_to_fp16, weight = var_1266_to_fp16, x = var_1257_cast); + tensor x_137_mode_0 = const()[name = tensor("x_137_mode_0"), val = tensor("EXACT")]; + tensor x_137_cast = gelu(mode = x_137_mode_0, x = input_89_cast); + tensor var_1272_to_fp16 = const()[name = tensor("op_1272_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278596864)))]; + tensor var_1273_to_fp16 = const()[name = tensor("op_1273_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286985536)))]; + tensor var_1274_cast = linear(bias = var_1273_to_fp16, weight = var_1272_to_fp16, x = x_137_cast); + tensor x_139_cast = add(x = x_133_cast, y = var_1274_cast); + tensor var_1283 = const()[name = tensor("op_1283"), val = tensor(-1)]; + tensor var_1300_axes_0 = const()[name = tensor("op_1300_axes_0"), val = tensor([-1])]; + tensor blocks_11_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_11_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286987648)))]; + tensor blocks_11_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_11_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286989760)))]; + tensor var_1289_to_fp16 = const()[name = tensor("op_1289_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1300_cast = layer_norm(axes = var_1300_axes_0, beta = blocks_11_attn_ln_bias_to_fp16, epsilon = var_1289_to_fp16, gamma = blocks_11_attn_ln_weight_to_fp16, x = x_139_cast); + tensor var_1311_to_fp16 = const()[name = tensor("op_1311_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286991872)))]; + tensor var_1312_to_fp16 = const()[name = tensor("op_1312_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(289089088)))]; + tensor q_45_cast = linear(bias = var_1312_to_fp16, weight = var_1311_to_fp16, x = var_1300_cast); + tensor var_1315_to_fp16 = const()[name = tensor("op_1315_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(289091200)))]; + tensor k_45_bias_0_to_fp16 = const()[name = tensor("k_45_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291188416)))]; + tensor k_45_cast = linear(bias = k_45_bias_0_to_fp16, weight = var_1315_to_fp16, x = var_1300_cast); + tensor var_1319_to_fp16 = const()[name = tensor("op_1319_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291190528)))]; + tensor var_1320_to_fp16 = const()[name = tensor("op_1320_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293287744)))]; + tensor v_45_cast = linear(bias = var_1320_to_fp16, weight = var_1319_to_fp16, x = var_1300_cast); + tensor var_1328 = const()[name = tensor("op_1328"), val = tensor([1, 1500, 16, -1])]; + tensor var_1329_cast = reshape(shape = var_1328, x = q_45_cast); + tensor const_190_to_fp16 = const()[name = tensor("const_190_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_47_cast = mul(x = var_1329_cast, y = const_190_to_fp16); + tensor var_1335 = const()[name = tensor("op_1335"), val = tensor([1, 1500, 16, -1])]; + tensor var_1336_cast = reshape(shape = var_1335, x = k_45_cast); + tensor const_191_to_fp16 = const()[name = tensor("const_191_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_47_cast = mul(x = var_1336_cast, y = const_191_to_fp16); + tensor var_1342 = const()[name = tensor("op_1342"), val = tensor([1, 1500, 16, -1])]; + tensor var_1343_cast = reshape(shape = var_1342, x = v_45_cast); + tensor var_1344 = const()[name = tensor("op_1344"), val = tensor([0, 2, 1, 3])]; + tensor qk_23_transpose_x_0 = const()[name = tensor("qk_23_transpose_x_0"), val = tensor(false)]; + tensor qk_23_transpose_y_0 = const()[name = tensor("qk_23_transpose_y_0"), val = tensor(false)]; + tensor transpose_70_perm_0 = const()[name = tensor("transpose_70_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_71_perm_0 = const()[name = tensor("transpose_71_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_145 = transpose(perm = transpose_71_perm_0, x = k_47_cast); + tensor transpose_146 = transpose(perm = transpose_70_perm_0, x = q_47_cast); + tensor qk_23_cast = matmul(transpose_x = qk_23_transpose_x_0, transpose_y = qk_23_transpose_y_0, x = transpose_146, y = transpose_145); + tensor var_1348_cast = softmax(axis = var_1283, x = qk_23_cast); + tensor var_1350_transpose_x_0 = const()[name = tensor("op_1350_transpose_x_0"), val = tensor(false)]; + tensor var_1350_transpose_y_0 = const()[name = tensor("op_1350_transpose_y_0"), val = tensor(false)]; + tensor transpose_147 = transpose(perm = var_1344, x = var_1343_cast); + tensor var_1350_cast = matmul(transpose_x = var_1350_transpose_x_0, transpose_y = var_1350_transpose_y_0, x = var_1348_cast, y = transpose_147); + tensor var_1351 = const()[name = tensor("op_1351"), val = tensor([0, 2, 1, 3])]; + tensor concat_11 = const()[name = tensor("concat_11"), val = tensor([1, 1500, 1024])]; + tensor transpose_144 = transpose(perm = var_1351, x = var_1350_cast); + tensor x_143_cast = reshape(shape = concat_11, x = transpose_144); + tensor var_1356_to_fp16 = const()[name = tensor("op_1356_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293289856)))]; + tensor var_1357_to_fp16 = const()[name = tensor("op_1357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295387072)))]; + tensor var_1358_cast = linear(bias = var_1357_to_fp16, weight = var_1356_to_fp16, x = x_143_cast); + tensor x_145_cast = add(x = x_139_cast, y = var_1358_cast); + tensor var_1364_axes_0 = const()[name = tensor("op_1364_axes_0"), val = tensor([-1])]; + tensor blocks_11_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_11_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295389184)))]; + tensor blocks_11_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_11_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295391296)))]; + tensor var_1364_cast = layer_norm(axes = var_1364_axes_0, beta = blocks_11_mlp_ln_bias_to_fp16, epsilon = var_1289_to_fp16, gamma = blocks_11_mlp_ln_weight_to_fp16, x = x_145_cast); + tensor var_1373_to_fp16 = const()[name = tensor("op_1373_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295393408)))]; + tensor var_1374_to_fp16 = const()[name = tensor("op_1374_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303782080)))]; + tensor input_97_cast = linear(bias = var_1374_to_fp16, weight = var_1373_to_fp16, x = var_1364_cast); + tensor x_149_mode_0 = const()[name = tensor("x_149_mode_0"), val = tensor("EXACT")]; + tensor x_149_cast = gelu(mode = x_149_mode_0, x = input_97_cast); + tensor var_1379_to_fp16 = const()[name = tensor("op_1379_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303790336)))]; + tensor var_1380_to_fp16 = const()[name = tensor("op_1380_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312179008)))]; + tensor var_1381_cast = linear(bias = var_1380_to_fp16, weight = var_1379_to_fp16, x = x_149_cast); + tensor x_151_cast = add(x = x_145_cast, y = var_1381_cast); + tensor var_1390 = const()[name = tensor("op_1390"), val = tensor(-1)]; + tensor var_1407_axes_0 = const()[name = tensor("op_1407_axes_0"), val = tensor([-1])]; + tensor blocks_12_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_12_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312181120)))]; + tensor blocks_12_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_12_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312183232)))]; + tensor var_1396_to_fp16 = const()[name = tensor("op_1396_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1407_cast = layer_norm(axes = var_1407_axes_0, beta = blocks_12_attn_ln_bias_to_fp16, epsilon = var_1396_to_fp16, gamma = blocks_12_attn_ln_weight_to_fp16, x = x_151_cast); + tensor var_1418_to_fp16 = const()[name = tensor("op_1418_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312185344)))]; + tensor var_1419_to_fp16 = const()[name = tensor("op_1419_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(314282560)))]; + tensor q_49_cast = linear(bias = var_1419_to_fp16, weight = var_1418_to_fp16, x = var_1407_cast); + tensor var_1422_to_fp16 = const()[name = tensor("op_1422_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(314284672)))]; + tensor k_49_bias_0_to_fp16 = const()[name = tensor("k_49_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316381888)))]; + tensor k_49_cast = linear(bias = k_49_bias_0_to_fp16, weight = var_1422_to_fp16, x = var_1407_cast); + tensor var_1426_to_fp16 = const()[name = tensor("op_1426_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316384000)))]; + tensor var_1427_to_fp16 = const()[name = tensor("op_1427_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(318481216)))]; + tensor v_49_cast = linear(bias = var_1427_to_fp16, weight = var_1426_to_fp16, x = var_1407_cast); + tensor var_1435 = const()[name = tensor("op_1435"), val = tensor([1, 1500, 16, -1])]; + tensor var_1436_cast = reshape(shape = var_1435, x = q_49_cast); + tensor const_192_to_fp16 = const()[name = tensor("const_192_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_51_cast = mul(x = var_1436_cast, y = const_192_to_fp16); + tensor var_1442 = const()[name = tensor("op_1442"), val = tensor([1, 1500, 16, -1])]; + tensor var_1443_cast = reshape(shape = var_1442, x = k_49_cast); + tensor const_193_to_fp16 = const()[name = tensor("const_193_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_51_cast = mul(x = var_1443_cast, y = const_193_to_fp16); + tensor var_1449 = const()[name = tensor("op_1449"), val = tensor([1, 1500, 16, -1])]; + tensor var_1450_cast = reshape(shape = var_1449, x = v_49_cast); + tensor var_1451 = const()[name = tensor("op_1451"), val = tensor([0, 2, 1, 3])]; + tensor qk_25_transpose_x_0 = const()[name = tensor("qk_25_transpose_x_0"), val = tensor(false)]; + tensor qk_25_transpose_y_0 = const()[name = tensor("qk_25_transpose_y_0"), val = tensor(false)]; + tensor transpose_72_perm_0 = const()[name = tensor("transpose_72_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_73_perm_0 = const()[name = tensor("transpose_73_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_141 = transpose(perm = transpose_73_perm_0, x = k_51_cast); + tensor transpose_142 = transpose(perm = transpose_72_perm_0, x = q_51_cast); + tensor qk_25_cast = matmul(transpose_x = qk_25_transpose_x_0, transpose_y = qk_25_transpose_y_0, x = transpose_142, y = transpose_141); + tensor var_1455_cast = softmax(axis = var_1390, x = qk_25_cast); + tensor var_1457_transpose_x_0 = const()[name = tensor("op_1457_transpose_x_0"), val = tensor(false)]; + tensor var_1457_transpose_y_0 = const()[name = tensor("op_1457_transpose_y_0"), val = tensor(false)]; + tensor transpose_143 = transpose(perm = var_1451, x = var_1450_cast); + tensor var_1457_cast = matmul(transpose_x = var_1457_transpose_x_0, transpose_y = var_1457_transpose_y_0, x = var_1455_cast, y = transpose_143); + tensor var_1458 = const()[name = tensor("op_1458"), val = tensor([0, 2, 1, 3])]; + tensor concat_12 = const()[name = tensor("concat_12"), val = tensor([1, 1500, 1024])]; + tensor transpose_140 = transpose(perm = var_1458, x = var_1457_cast); + tensor x_155_cast = reshape(shape = concat_12, x = transpose_140); + tensor var_1463_to_fp16 = const()[name = tensor("op_1463_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(318483328)))]; + tensor var_1464_to_fp16 = const()[name = tensor("op_1464_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320580544)))]; + tensor var_1465_cast = linear(bias = var_1464_to_fp16, weight = var_1463_to_fp16, x = x_155_cast); + tensor x_157_cast = add(x = x_151_cast, y = var_1465_cast); + tensor var_1471_axes_0 = const()[name = tensor("op_1471_axes_0"), val = tensor([-1])]; + tensor blocks_12_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_12_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320582656)))]; + tensor blocks_12_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_12_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320584768)))]; + tensor var_1471_cast = layer_norm(axes = var_1471_axes_0, beta = blocks_12_mlp_ln_bias_to_fp16, epsilon = var_1396_to_fp16, gamma = blocks_12_mlp_ln_weight_to_fp16, x = x_157_cast); + tensor var_1480_to_fp16 = const()[name = tensor("op_1480_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320586880)))]; + tensor var_1481_to_fp16 = const()[name = tensor("op_1481_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(328975552)))]; + tensor input_105_cast = linear(bias = var_1481_to_fp16, weight = var_1480_to_fp16, x = var_1471_cast); + tensor x_161_mode_0 = const()[name = tensor("x_161_mode_0"), val = tensor("EXACT")]; + tensor x_161_cast = gelu(mode = x_161_mode_0, x = input_105_cast); + tensor var_1486_to_fp16 = const()[name = tensor("op_1486_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(328983808)))]; + tensor var_1487_to_fp16 = const()[name = tensor("op_1487_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337372480)))]; + tensor var_1488_cast = linear(bias = var_1487_to_fp16, weight = var_1486_to_fp16, x = x_161_cast); + tensor x_163_cast = add(x = x_157_cast, y = var_1488_cast); + tensor var_1497 = const()[name = tensor("op_1497"), val = tensor(-1)]; + tensor var_1514_axes_0 = const()[name = tensor("op_1514_axes_0"), val = tensor([-1])]; + tensor blocks_13_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_13_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337374592)))]; + tensor blocks_13_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_13_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337376704)))]; + tensor var_1503_to_fp16 = const()[name = tensor("op_1503_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1514_cast = layer_norm(axes = var_1514_axes_0, beta = blocks_13_attn_ln_bias_to_fp16, epsilon = var_1503_to_fp16, gamma = blocks_13_attn_ln_weight_to_fp16, x = x_163_cast); + tensor var_1525_to_fp16 = const()[name = tensor("op_1525_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337378816)))]; + tensor var_1526_to_fp16 = const()[name = tensor("op_1526_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339476032)))]; + tensor q_53_cast = linear(bias = var_1526_to_fp16, weight = var_1525_to_fp16, x = var_1514_cast); + tensor var_1529_to_fp16 = const()[name = tensor("op_1529_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339478144)))]; + tensor k_53_bias_0_to_fp16 = const()[name = tensor("k_53_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341575360)))]; + tensor k_53_cast = linear(bias = k_53_bias_0_to_fp16, weight = var_1529_to_fp16, x = var_1514_cast); + tensor var_1533_to_fp16 = const()[name = tensor("op_1533_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341577472)))]; + tensor var_1534_to_fp16 = const()[name = tensor("op_1534_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343674688)))]; + tensor v_53_cast = linear(bias = var_1534_to_fp16, weight = var_1533_to_fp16, x = var_1514_cast); + tensor var_1542 = const()[name = tensor("op_1542"), val = tensor([1, 1500, 16, -1])]; + tensor var_1543_cast = reshape(shape = var_1542, x = q_53_cast); + tensor const_194_to_fp16 = const()[name = tensor("const_194_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_55_cast = mul(x = var_1543_cast, y = const_194_to_fp16); + tensor var_1549 = const()[name = tensor("op_1549"), val = tensor([1, 1500, 16, -1])]; + tensor var_1550_cast = reshape(shape = var_1549, x = k_53_cast); + tensor const_195_to_fp16 = const()[name = tensor("const_195_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_55_cast = mul(x = var_1550_cast, y = const_195_to_fp16); + tensor var_1556 = const()[name = tensor("op_1556"), val = tensor([1, 1500, 16, -1])]; + tensor var_1557_cast = reshape(shape = var_1556, x = v_53_cast); + tensor var_1558 = const()[name = tensor("op_1558"), val = tensor([0, 2, 1, 3])]; + tensor qk_27_transpose_x_0 = const()[name = tensor("qk_27_transpose_x_0"), val = tensor(false)]; + tensor qk_27_transpose_y_0 = const()[name = tensor("qk_27_transpose_y_0"), val = tensor(false)]; + tensor transpose_74_perm_0 = const()[name = tensor("transpose_74_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_75_perm_0 = const()[name = tensor("transpose_75_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_137 = transpose(perm = transpose_75_perm_0, x = k_55_cast); + tensor transpose_138 = transpose(perm = transpose_74_perm_0, x = q_55_cast); + tensor qk_27_cast = matmul(transpose_x = qk_27_transpose_x_0, transpose_y = qk_27_transpose_y_0, x = transpose_138, y = transpose_137); + tensor var_1562_cast = softmax(axis = var_1497, x = qk_27_cast); + tensor var_1564_transpose_x_0 = const()[name = tensor("op_1564_transpose_x_0"), val = tensor(false)]; + tensor var_1564_transpose_y_0 = const()[name = tensor("op_1564_transpose_y_0"), val = tensor(false)]; + tensor transpose_139 = transpose(perm = var_1558, x = var_1557_cast); + tensor var_1564_cast = matmul(transpose_x = var_1564_transpose_x_0, transpose_y = var_1564_transpose_y_0, x = var_1562_cast, y = transpose_139); + tensor var_1565 = const()[name = tensor("op_1565"), val = tensor([0, 2, 1, 3])]; + tensor concat_13 = const()[name = tensor("concat_13"), val = tensor([1, 1500, 1024])]; + tensor transpose_136 = transpose(perm = var_1565, x = var_1564_cast); + tensor x_167_cast = reshape(shape = concat_13, x = transpose_136); + tensor var_1570_to_fp16 = const()[name = tensor("op_1570_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343676800)))]; + tensor var_1571_to_fp16 = const()[name = tensor("op_1571_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345774016)))]; + tensor var_1572_cast = linear(bias = var_1571_to_fp16, weight = var_1570_to_fp16, x = x_167_cast); + tensor x_169_cast = add(x = x_163_cast, y = var_1572_cast); + tensor var_1578_axes_0 = const()[name = tensor("op_1578_axes_0"), val = tensor([-1])]; + tensor blocks_13_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_13_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345776128)))]; + tensor blocks_13_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_13_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345778240)))]; + tensor var_1578_cast = layer_norm(axes = var_1578_axes_0, beta = blocks_13_mlp_ln_bias_to_fp16, epsilon = var_1503_to_fp16, gamma = blocks_13_mlp_ln_weight_to_fp16, x = x_169_cast); + tensor var_1587_to_fp16 = const()[name = tensor("op_1587_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345780352)))]; + tensor var_1588_to_fp16 = const()[name = tensor("op_1588_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354169024)))]; + tensor input_113_cast = linear(bias = var_1588_to_fp16, weight = var_1587_to_fp16, x = var_1578_cast); + tensor x_173_mode_0 = const()[name = tensor("x_173_mode_0"), val = tensor("EXACT")]; + tensor x_173_cast = gelu(mode = x_173_mode_0, x = input_113_cast); + tensor var_1593_to_fp16 = const()[name = tensor("op_1593_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354177280)))]; + tensor var_1594_to_fp16 = const()[name = tensor("op_1594_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362565952)))]; + tensor var_1595_cast = linear(bias = var_1594_to_fp16, weight = var_1593_to_fp16, x = x_173_cast); + tensor x_175_cast = add(x = x_169_cast, y = var_1595_cast); + tensor var_1604 = const()[name = tensor("op_1604"), val = tensor(-1)]; + tensor var_1621_axes_0 = const()[name = tensor("op_1621_axes_0"), val = tensor([-1])]; + tensor blocks_14_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_14_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362568064)))]; + tensor blocks_14_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_14_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362570176)))]; + tensor var_1610_to_fp16 = const()[name = tensor("op_1610_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1621_cast = layer_norm(axes = var_1621_axes_0, beta = blocks_14_attn_ln_bias_to_fp16, epsilon = var_1610_to_fp16, gamma = blocks_14_attn_ln_weight_to_fp16, x = x_175_cast); + tensor var_1632_to_fp16 = const()[name = tensor("op_1632_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362572288)))]; + tensor var_1633_to_fp16 = const()[name = tensor("op_1633_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(364669504)))]; + tensor q_57_cast = linear(bias = var_1633_to_fp16, weight = var_1632_to_fp16, x = var_1621_cast); + tensor var_1636_to_fp16 = const()[name = tensor("op_1636_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(364671616)))]; + tensor k_57_bias_0_to_fp16 = const()[name = tensor("k_57_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(366768832)))]; + tensor k_57_cast = linear(bias = k_57_bias_0_to_fp16, weight = var_1636_to_fp16, x = var_1621_cast); + tensor var_1640_to_fp16 = const()[name = tensor("op_1640_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(366770944)))]; + tensor var_1641_to_fp16 = const()[name = tensor("op_1641_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368868160)))]; + tensor v_57_cast = linear(bias = var_1641_to_fp16, weight = var_1640_to_fp16, x = var_1621_cast); + tensor var_1649 = const()[name = tensor("op_1649"), val = tensor([1, 1500, 16, -1])]; + tensor var_1650_cast = reshape(shape = var_1649, x = q_57_cast); + tensor const_196_to_fp16 = const()[name = tensor("const_196_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_59_cast = mul(x = var_1650_cast, y = const_196_to_fp16); + tensor var_1656 = const()[name = tensor("op_1656"), val = tensor([1, 1500, 16, -1])]; + tensor var_1657_cast = reshape(shape = var_1656, x = k_57_cast); + tensor const_197_to_fp16 = const()[name = tensor("const_197_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_59_cast = mul(x = var_1657_cast, y = const_197_to_fp16); + tensor var_1663 = const()[name = tensor("op_1663"), val = tensor([1, 1500, 16, -1])]; + tensor var_1664_cast = reshape(shape = var_1663, x = v_57_cast); + tensor var_1665 = const()[name = tensor("op_1665"), val = tensor([0, 2, 1, 3])]; + tensor qk_29_transpose_x_0 = const()[name = tensor("qk_29_transpose_x_0"), val = tensor(false)]; + tensor qk_29_transpose_y_0 = const()[name = tensor("qk_29_transpose_y_0"), val = tensor(false)]; + tensor transpose_76_perm_0 = const()[name = tensor("transpose_76_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_77_perm_0 = const()[name = tensor("transpose_77_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_133 = transpose(perm = transpose_77_perm_0, x = k_59_cast); + tensor transpose_134 = transpose(perm = transpose_76_perm_0, x = q_59_cast); + tensor qk_29_cast = matmul(transpose_x = qk_29_transpose_x_0, transpose_y = qk_29_transpose_y_0, x = transpose_134, y = transpose_133); + tensor var_1669_cast = softmax(axis = var_1604, x = qk_29_cast); + tensor var_1671_transpose_x_0 = const()[name = tensor("op_1671_transpose_x_0"), val = tensor(false)]; + tensor var_1671_transpose_y_0 = const()[name = tensor("op_1671_transpose_y_0"), val = tensor(false)]; + tensor transpose_135 = transpose(perm = var_1665, x = var_1664_cast); + tensor var_1671_cast = matmul(transpose_x = var_1671_transpose_x_0, transpose_y = var_1671_transpose_y_0, x = var_1669_cast, y = transpose_135); + tensor var_1672 = const()[name = tensor("op_1672"), val = tensor([0, 2, 1, 3])]; + tensor concat_14 = const()[name = tensor("concat_14"), val = tensor([1, 1500, 1024])]; + tensor transpose_132 = transpose(perm = var_1672, x = var_1671_cast); + tensor x_179_cast = reshape(shape = concat_14, x = transpose_132); + tensor var_1677_to_fp16 = const()[name = tensor("op_1677_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368870272)))]; + tensor var_1678_to_fp16 = const()[name = tensor("op_1678_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370967488)))]; + tensor var_1679_cast = linear(bias = var_1678_to_fp16, weight = var_1677_to_fp16, x = x_179_cast); + tensor x_181_cast = add(x = x_175_cast, y = var_1679_cast); + tensor var_1685_axes_0 = const()[name = tensor("op_1685_axes_0"), val = tensor([-1])]; + tensor blocks_14_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_14_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370969600)))]; + tensor blocks_14_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_14_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370971712)))]; + tensor var_1685_cast = layer_norm(axes = var_1685_axes_0, beta = blocks_14_mlp_ln_bias_to_fp16, epsilon = var_1610_to_fp16, gamma = blocks_14_mlp_ln_weight_to_fp16, x = x_181_cast); + tensor var_1694_to_fp16 = const()[name = tensor("op_1694_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370973824)))]; + tensor var_1695_to_fp16 = const()[name = tensor("op_1695_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(379362496)))]; + tensor input_121_cast = linear(bias = var_1695_to_fp16, weight = var_1694_to_fp16, x = var_1685_cast); + tensor x_185_mode_0 = const()[name = tensor("x_185_mode_0"), val = tensor("EXACT")]; + tensor x_185_cast = gelu(mode = x_185_mode_0, x = input_121_cast); + tensor var_1700_to_fp16 = const()[name = tensor("op_1700_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(379370752)))]; + tensor var_1701_to_fp16 = const()[name = tensor("op_1701_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387759424)))]; + tensor var_1702_cast = linear(bias = var_1701_to_fp16, weight = var_1700_to_fp16, x = x_185_cast); + tensor x_187_cast = add(x = x_181_cast, y = var_1702_cast); + tensor var_1711 = const()[name = tensor("op_1711"), val = tensor(-1)]; + tensor var_1728_axes_0 = const()[name = tensor("op_1728_axes_0"), val = tensor([-1])]; + tensor blocks_15_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_15_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387761536)))]; + tensor blocks_15_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_15_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387763648)))]; + tensor var_1717_to_fp16 = const()[name = tensor("op_1717_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1728_cast = layer_norm(axes = var_1728_axes_0, beta = blocks_15_attn_ln_bias_to_fp16, epsilon = var_1717_to_fp16, gamma = blocks_15_attn_ln_weight_to_fp16, x = x_187_cast); + tensor var_1739_to_fp16 = const()[name = tensor("op_1739_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387765760)))]; + tensor var_1740_to_fp16 = const()[name = tensor("op_1740_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(389862976)))]; + tensor q_61_cast = linear(bias = var_1740_to_fp16, weight = var_1739_to_fp16, x = var_1728_cast); + tensor var_1743_to_fp16 = const()[name = tensor("op_1743_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(389865088)))]; + tensor k_61_bias_0_to_fp16 = const()[name = tensor("k_61_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(391962304)))]; + tensor k_61_cast = linear(bias = k_61_bias_0_to_fp16, weight = var_1743_to_fp16, x = var_1728_cast); + tensor var_1747_to_fp16 = const()[name = tensor("op_1747_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(391964416)))]; + tensor var_1748_to_fp16 = const()[name = tensor("op_1748_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394061632)))]; + tensor v_61_cast = linear(bias = var_1748_to_fp16, weight = var_1747_to_fp16, x = var_1728_cast); + tensor var_1756 = const()[name = tensor("op_1756"), val = tensor([1, 1500, 16, -1])]; + tensor var_1757_cast = reshape(shape = var_1756, x = q_61_cast); + tensor const_198_to_fp16 = const()[name = tensor("const_198_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_63_cast = mul(x = var_1757_cast, y = const_198_to_fp16); + tensor var_1763 = const()[name = tensor("op_1763"), val = tensor([1, 1500, 16, -1])]; + tensor var_1764_cast = reshape(shape = var_1763, x = k_61_cast); + tensor const_199_to_fp16 = const()[name = tensor("const_199_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_63_cast = mul(x = var_1764_cast, y = const_199_to_fp16); + tensor var_1770 = const()[name = tensor("op_1770"), val = tensor([1, 1500, 16, -1])]; + tensor var_1771_cast = reshape(shape = var_1770, x = v_61_cast); + tensor var_1772 = const()[name = tensor("op_1772"), val = tensor([0, 2, 1, 3])]; + tensor qk_31_transpose_x_0 = const()[name = tensor("qk_31_transpose_x_0"), val = tensor(false)]; + tensor qk_31_transpose_y_0 = const()[name = tensor("qk_31_transpose_y_0"), val = tensor(false)]; + tensor transpose_78_perm_0 = const()[name = tensor("transpose_78_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_79_perm_0 = const()[name = tensor("transpose_79_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_129 = transpose(perm = transpose_79_perm_0, x = k_63_cast); + tensor transpose_130 = transpose(perm = transpose_78_perm_0, x = q_63_cast); + tensor qk_31_cast = matmul(transpose_x = qk_31_transpose_x_0, transpose_y = qk_31_transpose_y_0, x = transpose_130, y = transpose_129); + tensor var_1776_cast = softmax(axis = var_1711, x = qk_31_cast); + tensor var_1778_transpose_x_0 = const()[name = tensor("op_1778_transpose_x_0"), val = tensor(false)]; + tensor var_1778_transpose_y_0 = const()[name = tensor("op_1778_transpose_y_0"), val = tensor(false)]; + tensor transpose_131 = transpose(perm = var_1772, x = var_1771_cast); + tensor var_1778_cast = matmul(transpose_x = var_1778_transpose_x_0, transpose_y = var_1778_transpose_y_0, x = var_1776_cast, y = transpose_131); + tensor var_1779 = const()[name = tensor("op_1779"), val = tensor([0, 2, 1, 3])]; + tensor concat_15 = const()[name = tensor("concat_15"), val = tensor([1, 1500, 1024])]; + tensor transpose_128 = transpose(perm = var_1779, x = var_1778_cast); + tensor x_191_cast = reshape(shape = concat_15, x = transpose_128); + tensor var_1784_to_fp16 = const()[name = tensor("op_1784_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394063744)))]; + tensor var_1785_to_fp16 = const()[name = tensor("op_1785_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396160960)))]; + tensor var_1786_cast = linear(bias = var_1785_to_fp16, weight = var_1784_to_fp16, x = x_191_cast); + tensor x_193_cast = add(x = x_187_cast, y = var_1786_cast); + tensor var_1792_axes_0 = const()[name = tensor("op_1792_axes_0"), val = tensor([-1])]; + tensor blocks_15_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_15_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396163072)))]; + tensor blocks_15_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_15_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396165184)))]; + tensor var_1792_cast = layer_norm(axes = var_1792_axes_0, beta = blocks_15_mlp_ln_bias_to_fp16, epsilon = var_1717_to_fp16, gamma = blocks_15_mlp_ln_weight_to_fp16, x = x_193_cast); + tensor var_1801_to_fp16 = const()[name = tensor("op_1801_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396167296)))]; + tensor var_1802_to_fp16 = const()[name = tensor("op_1802_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(404555968)))]; + tensor input_129_cast = linear(bias = var_1802_to_fp16, weight = var_1801_to_fp16, x = var_1792_cast); + tensor x_197_mode_0 = const()[name = tensor("x_197_mode_0"), val = tensor("EXACT")]; + tensor x_197_cast = gelu(mode = x_197_mode_0, x = input_129_cast); + tensor var_1807_to_fp16 = const()[name = tensor("op_1807_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(404564224)))]; + tensor var_1808_to_fp16 = const()[name = tensor("op_1808_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412952896)))]; + tensor var_1809_cast = linear(bias = var_1808_to_fp16, weight = var_1807_to_fp16, x = x_197_cast); + tensor x_199_cast = add(x = x_193_cast, y = var_1809_cast); + tensor var_1818 = const()[name = tensor("op_1818"), val = tensor(-1)]; + tensor var_1835_axes_0 = const()[name = tensor("op_1835_axes_0"), val = tensor([-1])]; + tensor blocks_16_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_16_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412955008)))]; + tensor blocks_16_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_16_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412957120)))]; + tensor var_1824_to_fp16 = const()[name = tensor("op_1824_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1835_cast = layer_norm(axes = var_1835_axes_0, beta = blocks_16_attn_ln_bias_to_fp16, epsilon = var_1824_to_fp16, gamma = blocks_16_attn_ln_weight_to_fp16, x = x_199_cast); + tensor var_1846_to_fp16 = const()[name = tensor("op_1846_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412959232)))]; + tensor var_1847_to_fp16 = const()[name = tensor("op_1847_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415056448)))]; + tensor q_65_cast = linear(bias = var_1847_to_fp16, weight = var_1846_to_fp16, x = var_1835_cast); + tensor var_1850_to_fp16 = const()[name = tensor("op_1850_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415058560)))]; + tensor k_65_bias_0_to_fp16 = const()[name = tensor("k_65_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(417155776)))]; + tensor k_65_cast = linear(bias = k_65_bias_0_to_fp16, weight = var_1850_to_fp16, x = var_1835_cast); + tensor var_1854_to_fp16 = const()[name = tensor("op_1854_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(417157888)))]; + tensor var_1855_to_fp16 = const()[name = tensor("op_1855_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419255104)))]; + tensor v_65_cast = linear(bias = var_1855_to_fp16, weight = var_1854_to_fp16, x = var_1835_cast); + tensor var_1863 = const()[name = tensor("op_1863"), val = tensor([1, 1500, 16, -1])]; + tensor var_1864_cast = reshape(shape = var_1863, x = q_65_cast); + tensor const_200_to_fp16 = const()[name = tensor("const_200_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_67_cast = mul(x = var_1864_cast, y = const_200_to_fp16); + tensor var_1870 = const()[name = tensor("op_1870"), val = tensor([1, 1500, 16, -1])]; + tensor var_1871_cast = reshape(shape = var_1870, x = k_65_cast); + tensor const_201_to_fp16 = const()[name = tensor("const_201_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_67_cast = mul(x = var_1871_cast, y = const_201_to_fp16); + tensor var_1877 = const()[name = tensor("op_1877"), val = tensor([1, 1500, 16, -1])]; + tensor var_1878_cast = reshape(shape = var_1877, x = v_65_cast); + tensor var_1879 = const()[name = tensor("op_1879"), val = tensor([0, 2, 1, 3])]; + tensor qk_33_transpose_x_0 = const()[name = tensor("qk_33_transpose_x_0"), val = tensor(false)]; + tensor qk_33_transpose_y_0 = const()[name = tensor("qk_33_transpose_y_0"), val = tensor(false)]; + tensor transpose_80_perm_0 = const()[name = tensor("transpose_80_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_81_perm_0 = const()[name = tensor("transpose_81_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_125 = transpose(perm = transpose_81_perm_0, x = k_67_cast); + tensor transpose_126 = transpose(perm = transpose_80_perm_0, x = q_67_cast); + tensor qk_33_cast = matmul(transpose_x = qk_33_transpose_x_0, transpose_y = qk_33_transpose_y_0, x = transpose_126, y = transpose_125); + tensor var_1883_cast = softmax(axis = var_1818, x = qk_33_cast); + tensor var_1885_transpose_x_0 = const()[name = tensor("op_1885_transpose_x_0"), val = tensor(false)]; + tensor var_1885_transpose_y_0 = const()[name = tensor("op_1885_transpose_y_0"), val = tensor(false)]; + tensor transpose_127 = transpose(perm = var_1879, x = var_1878_cast); + tensor var_1885_cast = matmul(transpose_x = var_1885_transpose_x_0, transpose_y = var_1885_transpose_y_0, x = var_1883_cast, y = transpose_127); + tensor var_1886 = const()[name = tensor("op_1886"), val = tensor([0, 2, 1, 3])]; + tensor concat_16 = const()[name = tensor("concat_16"), val = tensor([1, 1500, 1024])]; + tensor transpose_124 = transpose(perm = var_1886, x = var_1885_cast); + tensor x_203_cast = reshape(shape = concat_16, x = transpose_124); + tensor var_1891_to_fp16 = const()[name = tensor("op_1891_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419257216)))]; + tensor var_1892_to_fp16 = const()[name = tensor("op_1892_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421354432)))]; + tensor var_1893_cast = linear(bias = var_1892_to_fp16, weight = var_1891_to_fp16, x = x_203_cast); + tensor x_205_cast = add(x = x_199_cast, y = var_1893_cast); + tensor var_1899_axes_0 = const()[name = tensor("op_1899_axes_0"), val = tensor([-1])]; + tensor blocks_16_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_16_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421356544)))]; + tensor blocks_16_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_16_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421358656)))]; + tensor var_1899_cast = layer_norm(axes = var_1899_axes_0, beta = blocks_16_mlp_ln_bias_to_fp16, epsilon = var_1824_to_fp16, gamma = blocks_16_mlp_ln_weight_to_fp16, x = x_205_cast); + tensor var_1908_to_fp16 = const()[name = tensor("op_1908_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421360768)))]; + tensor var_1909_to_fp16 = const()[name = tensor("op_1909_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(429749440)))]; + tensor input_137_cast = linear(bias = var_1909_to_fp16, weight = var_1908_to_fp16, x = var_1899_cast); + tensor x_209_mode_0 = const()[name = tensor("x_209_mode_0"), val = tensor("EXACT")]; + tensor x_209_cast = gelu(mode = x_209_mode_0, x = input_137_cast); + tensor var_1914_to_fp16 = const()[name = tensor("op_1914_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(429757696)))]; + tensor var_1915_to_fp16 = const()[name = tensor("op_1915_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(438146368)))]; + tensor var_1916_cast = linear(bias = var_1915_to_fp16, weight = var_1914_to_fp16, x = x_209_cast); + tensor x_211_cast = add(x = x_205_cast, y = var_1916_cast); + tensor var_1925 = const()[name = tensor("op_1925"), val = tensor(-1)]; + tensor var_1942_axes_0 = const()[name = tensor("op_1942_axes_0"), val = tensor([-1])]; + tensor blocks_17_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_17_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(438148480)))]; + tensor blocks_17_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_17_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(438150592)))]; + tensor var_1931_to_fp16 = const()[name = tensor("op_1931_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_1942_cast = layer_norm(axes = var_1942_axes_0, beta = blocks_17_attn_ln_bias_to_fp16, epsilon = var_1931_to_fp16, gamma = blocks_17_attn_ln_weight_to_fp16, x = x_211_cast); + tensor var_1953_to_fp16 = const()[name = tensor("op_1953_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(438152704)))]; + tensor var_1954_to_fp16 = const()[name = tensor("op_1954_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(440249920)))]; + tensor q_69_cast = linear(bias = var_1954_to_fp16, weight = var_1953_to_fp16, x = var_1942_cast); + tensor var_1957_to_fp16 = const()[name = tensor("op_1957_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(440252032)))]; + tensor k_69_bias_0_to_fp16 = const()[name = tensor("k_69_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442349248)))]; + tensor k_69_cast = linear(bias = k_69_bias_0_to_fp16, weight = var_1957_to_fp16, x = var_1942_cast); + tensor var_1961_to_fp16 = const()[name = tensor("op_1961_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442351360)))]; + tensor var_1962_to_fp16 = const()[name = tensor("op_1962_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444448576)))]; + tensor v_69_cast = linear(bias = var_1962_to_fp16, weight = var_1961_to_fp16, x = var_1942_cast); + tensor var_1970 = const()[name = tensor("op_1970"), val = tensor([1, 1500, 16, -1])]; + tensor var_1971_cast = reshape(shape = var_1970, x = q_69_cast); + tensor const_202_to_fp16 = const()[name = tensor("const_202_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_71_cast = mul(x = var_1971_cast, y = const_202_to_fp16); + tensor var_1977 = const()[name = tensor("op_1977"), val = tensor([1, 1500, 16, -1])]; + tensor var_1978_cast = reshape(shape = var_1977, x = k_69_cast); + tensor const_203_to_fp16 = const()[name = tensor("const_203_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_71_cast = mul(x = var_1978_cast, y = const_203_to_fp16); + tensor var_1984 = const()[name = tensor("op_1984"), val = tensor([1, 1500, 16, -1])]; + tensor var_1985_cast = reshape(shape = var_1984, x = v_69_cast); + tensor var_1986 = const()[name = tensor("op_1986"), val = tensor([0, 2, 1, 3])]; + tensor qk_35_transpose_x_0 = const()[name = tensor("qk_35_transpose_x_0"), val = tensor(false)]; + tensor qk_35_transpose_y_0 = const()[name = tensor("qk_35_transpose_y_0"), val = tensor(false)]; + tensor transpose_82_perm_0 = const()[name = tensor("transpose_82_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_83_perm_0 = const()[name = tensor("transpose_83_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_121 = transpose(perm = transpose_83_perm_0, x = k_71_cast); + tensor transpose_122 = transpose(perm = transpose_82_perm_0, x = q_71_cast); + tensor qk_35_cast = matmul(transpose_x = qk_35_transpose_x_0, transpose_y = qk_35_transpose_y_0, x = transpose_122, y = transpose_121); + tensor var_1990_cast = softmax(axis = var_1925, x = qk_35_cast); + tensor var_1992_transpose_x_0 = const()[name = tensor("op_1992_transpose_x_0"), val = tensor(false)]; + tensor var_1992_transpose_y_0 = const()[name = tensor("op_1992_transpose_y_0"), val = tensor(false)]; + tensor transpose_123 = transpose(perm = var_1986, x = var_1985_cast); + tensor var_1992_cast = matmul(transpose_x = var_1992_transpose_x_0, transpose_y = var_1992_transpose_y_0, x = var_1990_cast, y = transpose_123); + tensor var_1993 = const()[name = tensor("op_1993"), val = tensor([0, 2, 1, 3])]; + tensor concat_17 = const()[name = tensor("concat_17"), val = tensor([1, 1500, 1024])]; + tensor transpose_120 = transpose(perm = var_1993, x = var_1992_cast); + tensor x_215_cast = reshape(shape = concat_17, x = transpose_120); + tensor var_1998_to_fp16 = const()[name = tensor("op_1998_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444450688)))]; + tensor var_1999_to_fp16 = const()[name = tensor("op_1999_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446547904)))]; + tensor var_2000_cast = linear(bias = var_1999_to_fp16, weight = var_1998_to_fp16, x = x_215_cast); + tensor x_217_cast = add(x = x_211_cast, y = var_2000_cast); + tensor var_2006_axes_0 = const()[name = tensor("op_2006_axes_0"), val = tensor([-1])]; + tensor blocks_17_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_17_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446550016)))]; + tensor blocks_17_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_17_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446552128)))]; + tensor var_2006_cast = layer_norm(axes = var_2006_axes_0, beta = blocks_17_mlp_ln_bias_to_fp16, epsilon = var_1931_to_fp16, gamma = blocks_17_mlp_ln_weight_to_fp16, x = x_217_cast); + tensor var_2015_to_fp16 = const()[name = tensor("op_2015_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446554240)))]; + tensor var_2016_to_fp16 = const()[name = tensor("op_2016_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454942912)))]; + tensor input_145_cast = linear(bias = var_2016_to_fp16, weight = var_2015_to_fp16, x = var_2006_cast); + tensor x_221_mode_0 = const()[name = tensor("x_221_mode_0"), val = tensor("EXACT")]; + tensor x_221_cast = gelu(mode = x_221_mode_0, x = input_145_cast); + tensor var_2021_to_fp16 = const()[name = tensor("op_2021_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454951168)))]; + tensor var_2022_to_fp16 = const()[name = tensor("op_2022_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(463339840)))]; + tensor var_2023_cast = linear(bias = var_2022_to_fp16, weight = var_2021_to_fp16, x = x_221_cast); + tensor x_223_cast = add(x = x_217_cast, y = var_2023_cast); + tensor var_2032 = const()[name = tensor("op_2032"), val = tensor(-1)]; + tensor var_2049_axes_0 = const()[name = tensor("op_2049_axes_0"), val = tensor([-1])]; + tensor blocks_18_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_18_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(463341952)))]; + tensor blocks_18_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_18_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(463344064)))]; + tensor var_2038_to_fp16 = const()[name = tensor("op_2038_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2049_cast = layer_norm(axes = var_2049_axes_0, beta = blocks_18_attn_ln_bias_to_fp16, epsilon = var_2038_to_fp16, gamma = blocks_18_attn_ln_weight_to_fp16, x = x_223_cast); + tensor var_2060_to_fp16 = const()[name = tensor("op_2060_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(463346176)))]; + tensor var_2061_to_fp16 = const()[name = tensor("op_2061_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(465443392)))]; + tensor q_73_cast = linear(bias = var_2061_to_fp16, weight = var_2060_to_fp16, x = var_2049_cast); + tensor var_2064_to_fp16 = const()[name = tensor("op_2064_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(465445504)))]; + tensor k_73_bias_0_to_fp16 = const()[name = tensor("k_73_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(467542720)))]; + tensor k_73_cast = linear(bias = k_73_bias_0_to_fp16, weight = var_2064_to_fp16, x = var_2049_cast); + tensor var_2068_to_fp16 = const()[name = tensor("op_2068_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(467544832)))]; + tensor var_2069_to_fp16 = const()[name = tensor("op_2069_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(469642048)))]; + tensor v_73_cast = linear(bias = var_2069_to_fp16, weight = var_2068_to_fp16, x = var_2049_cast); + tensor var_2077 = const()[name = tensor("op_2077"), val = tensor([1, 1500, 16, -1])]; + tensor var_2078_cast = reshape(shape = var_2077, x = q_73_cast); + tensor const_204_to_fp16 = const()[name = tensor("const_204_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_75_cast = mul(x = var_2078_cast, y = const_204_to_fp16); + tensor var_2084 = const()[name = tensor("op_2084"), val = tensor([1, 1500, 16, -1])]; + tensor var_2085_cast = reshape(shape = var_2084, x = k_73_cast); + tensor const_205_to_fp16 = const()[name = tensor("const_205_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_75_cast = mul(x = var_2085_cast, y = const_205_to_fp16); + tensor var_2091 = const()[name = tensor("op_2091"), val = tensor([1, 1500, 16, -1])]; + tensor var_2092_cast = reshape(shape = var_2091, x = v_73_cast); + tensor var_2093 = const()[name = tensor("op_2093"), val = tensor([0, 2, 1, 3])]; + tensor qk_37_transpose_x_0 = const()[name = tensor("qk_37_transpose_x_0"), val = tensor(false)]; + tensor qk_37_transpose_y_0 = const()[name = tensor("qk_37_transpose_y_0"), val = tensor(false)]; + tensor transpose_84_perm_0 = const()[name = tensor("transpose_84_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_85_perm_0 = const()[name = tensor("transpose_85_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_117 = transpose(perm = transpose_85_perm_0, x = k_75_cast); + tensor transpose_118 = transpose(perm = transpose_84_perm_0, x = q_75_cast); + tensor qk_37_cast = matmul(transpose_x = qk_37_transpose_x_0, transpose_y = qk_37_transpose_y_0, x = transpose_118, y = transpose_117); + tensor var_2097_cast = softmax(axis = var_2032, x = qk_37_cast); + tensor var_2099_transpose_x_0 = const()[name = tensor("op_2099_transpose_x_0"), val = tensor(false)]; + tensor var_2099_transpose_y_0 = const()[name = tensor("op_2099_transpose_y_0"), val = tensor(false)]; + tensor transpose_119 = transpose(perm = var_2093, x = var_2092_cast); + tensor var_2099_cast = matmul(transpose_x = var_2099_transpose_x_0, transpose_y = var_2099_transpose_y_0, x = var_2097_cast, y = transpose_119); + tensor var_2100 = const()[name = tensor("op_2100"), val = tensor([0, 2, 1, 3])]; + tensor concat_18 = const()[name = tensor("concat_18"), val = tensor([1, 1500, 1024])]; + tensor transpose_116 = transpose(perm = var_2100, x = var_2099_cast); + tensor x_227_cast = reshape(shape = concat_18, x = transpose_116); + tensor var_2105_to_fp16 = const()[name = tensor("op_2105_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(469644160)))]; + tensor var_2106_to_fp16 = const()[name = tensor("op_2106_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(471741376)))]; + tensor var_2107_cast = linear(bias = var_2106_to_fp16, weight = var_2105_to_fp16, x = x_227_cast); + tensor x_229_cast = add(x = x_223_cast, y = var_2107_cast); + tensor var_2113_axes_0 = const()[name = tensor("op_2113_axes_0"), val = tensor([-1])]; + tensor blocks_18_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_18_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(471743488)))]; + tensor blocks_18_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_18_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(471745600)))]; + tensor var_2113_cast = layer_norm(axes = var_2113_axes_0, beta = blocks_18_mlp_ln_bias_to_fp16, epsilon = var_2038_to_fp16, gamma = blocks_18_mlp_ln_weight_to_fp16, x = x_229_cast); + tensor var_2122_to_fp16 = const()[name = tensor("op_2122_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(471747712)))]; + tensor var_2123_to_fp16 = const()[name = tensor("op_2123_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(480136384)))]; + tensor input_153_cast = linear(bias = var_2123_to_fp16, weight = var_2122_to_fp16, x = var_2113_cast); + tensor x_233_mode_0 = const()[name = tensor("x_233_mode_0"), val = tensor("EXACT")]; + tensor x_233_cast = gelu(mode = x_233_mode_0, x = input_153_cast); + tensor var_2128_to_fp16 = const()[name = tensor("op_2128_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(480144640)))]; + tensor var_2129_to_fp16 = const()[name = tensor("op_2129_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488533312)))]; + tensor var_2130_cast = linear(bias = var_2129_to_fp16, weight = var_2128_to_fp16, x = x_233_cast); + tensor x_235_cast = add(x = x_229_cast, y = var_2130_cast); + tensor var_2139 = const()[name = tensor("op_2139"), val = tensor(-1)]; + tensor var_2156_axes_0 = const()[name = tensor("op_2156_axes_0"), val = tensor([-1])]; + tensor blocks_19_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_19_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488535424)))]; + tensor blocks_19_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_19_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488537536)))]; + tensor var_2145_to_fp16 = const()[name = tensor("op_2145_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2156_cast = layer_norm(axes = var_2156_axes_0, beta = blocks_19_attn_ln_bias_to_fp16, epsilon = var_2145_to_fp16, gamma = blocks_19_attn_ln_weight_to_fp16, x = x_235_cast); + tensor var_2167_to_fp16 = const()[name = tensor("op_2167_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488539648)))]; + tensor var_2168_to_fp16 = const()[name = tensor("op_2168_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490636864)))]; + tensor q_77_cast = linear(bias = var_2168_to_fp16, weight = var_2167_to_fp16, x = var_2156_cast); + tensor var_2171_to_fp16 = const()[name = tensor("op_2171_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490638976)))]; + tensor k_77_bias_0_to_fp16 = const()[name = tensor("k_77_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492736192)))]; + tensor k_77_cast = linear(bias = k_77_bias_0_to_fp16, weight = var_2171_to_fp16, x = var_2156_cast); + tensor var_2175_to_fp16 = const()[name = tensor("op_2175_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492738304)))]; + tensor var_2176_to_fp16 = const()[name = tensor("op_2176_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(494835520)))]; + tensor v_77_cast = linear(bias = var_2176_to_fp16, weight = var_2175_to_fp16, x = var_2156_cast); + tensor var_2184 = const()[name = tensor("op_2184"), val = tensor([1, 1500, 16, -1])]; + tensor var_2185_cast = reshape(shape = var_2184, x = q_77_cast); + tensor const_206_to_fp16 = const()[name = tensor("const_206_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_79_cast = mul(x = var_2185_cast, y = const_206_to_fp16); + tensor var_2191 = const()[name = tensor("op_2191"), val = tensor([1, 1500, 16, -1])]; + tensor var_2192_cast = reshape(shape = var_2191, x = k_77_cast); + tensor const_207_to_fp16 = const()[name = tensor("const_207_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_79_cast = mul(x = var_2192_cast, y = const_207_to_fp16); + tensor var_2198 = const()[name = tensor("op_2198"), val = tensor([1, 1500, 16, -1])]; + tensor var_2199_cast = reshape(shape = var_2198, x = v_77_cast); + tensor var_2200 = const()[name = tensor("op_2200"), val = tensor([0, 2, 1, 3])]; + tensor qk_39_transpose_x_0 = const()[name = tensor("qk_39_transpose_x_0"), val = tensor(false)]; + tensor qk_39_transpose_y_0 = const()[name = tensor("qk_39_transpose_y_0"), val = tensor(false)]; + tensor transpose_86_perm_0 = const()[name = tensor("transpose_86_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_87_perm_0 = const()[name = tensor("transpose_87_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_113 = transpose(perm = transpose_87_perm_0, x = k_79_cast); + tensor transpose_114 = transpose(perm = transpose_86_perm_0, x = q_79_cast); + tensor qk_39_cast = matmul(transpose_x = qk_39_transpose_x_0, transpose_y = qk_39_transpose_y_0, x = transpose_114, y = transpose_113); + tensor var_2204_cast = softmax(axis = var_2139, x = qk_39_cast); + tensor var_2206_transpose_x_0 = const()[name = tensor("op_2206_transpose_x_0"), val = tensor(false)]; + tensor var_2206_transpose_y_0 = const()[name = tensor("op_2206_transpose_y_0"), val = tensor(false)]; + tensor transpose_115 = transpose(perm = var_2200, x = var_2199_cast); + tensor var_2206_cast = matmul(transpose_x = var_2206_transpose_x_0, transpose_y = var_2206_transpose_y_0, x = var_2204_cast, y = transpose_115); + tensor var_2207 = const()[name = tensor("op_2207"), val = tensor([0, 2, 1, 3])]; + tensor concat_19 = const()[name = tensor("concat_19"), val = tensor([1, 1500, 1024])]; + tensor transpose_112 = transpose(perm = var_2207, x = var_2206_cast); + tensor x_239_cast = reshape(shape = concat_19, x = transpose_112); + tensor var_2212_to_fp16 = const()[name = tensor("op_2212_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(494837632)))]; + tensor var_2213_to_fp16 = const()[name = tensor("op_2213_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496934848)))]; + tensor var_2214_cast = linear(bias = var_2213_to_fp16, weight = var_2212_to_fp16, x = x_239_cast); + tensor x_241_cast = add(x = x_235_cast, y = var_2214_cast); + tensor var_2220_axes_0 = const()[name = tensor("op_2220_axes_0"), val = tensor([-1])]; + tensor blocks_19_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_19_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496936960)))]; + tensor blocks_19_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_19_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496939072)))]; + tensor var_2220_cast = layer_norm(axes = var_2220_axes_0, beta = blocks_19_mlp_ln_bias_to_fp16, epsilon = var_2145_to_fp16, gamma = blocks_19_mlp_ln_weight_to_fp16, x = x_241_cast); + tensor var_2229_to_fp16 = const()[name = tensor("op_2229_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496941184)))]; + tensor var_2230_to_fp16 = const()[name = tensor("op_2230_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(505329856)))]; + tensor input_161_cast = linear(bias = var_2230_to_fp16, weight = var_2229_to_fp16, x = var_2220_cast); + tensor x_245_mode_0 = const()[name = tensor("x_245_mode_0"), val = tensor("EXACT")]; + tensor x_245_cast = gelu(mode = x_245_mode_0, x = input_161_cast); + tensor var_2235_to_fp16 = const()[name = tensor("op_2235_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(505338112)))]; + tensor var_2236_to_fp16 = const()[name = tensor("op_2236_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513726784)))]; + tensor var_2237_cast = linear(bias = var_2236_to_fp16, weight = var_2235_to_fp16, x = x_245_cast); + tensor x_247_cast = add(x = x_241_cast, y = var_2237_cast); + tensor var_2246 = const()[name = tensor("op_2246"), val = tensor(-1)]; + tensor var_2263_axes_0 = const()[name = tensor("op_2263_axes_0"), val = tensor([-1])]; + tensor blocks_20_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_20_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513728896)))]; + tensor blocks_20_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_20_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513731008)))]; + tensor var_2252_to_fp16 = const()[name = tensor("op_2252_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2263_cast = layer_norm(axes = var_2263_axes_0, beta = blocks_20_attn_ln_bias_to_fp16, epsilon = var_2252_to_fp16, gamma = blocks_20_attn_ln_weight_to_fp16, x = x_247_cast); + tensor var_2274_to_fp16 = const()[name = tensor("op_2274_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513733120)))]; + tensor var_2275_to_fp16 = const()[name = tensor("op_2275_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(515830336)))]; + tensor q_81_cast = linear(bias = var_2275_to_fp16, weight = var_2274_to_fp16, x = var_2263_cast); + tensor var_2278_to_fp16 = const()[name = tensor("op_2278_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(515832448)))]; + tensor k_81_bias_0_to_fp16 = const()[name = tensor("k_81_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(517929664)))]; + tensor k_81_cast = linear(bias = k_81_bias_0_to_fp16, weight = var_2278_to_fp16, x = var_2263_cast); + tensor var_2282_to_fp16 = const()[name = tensor("op_2282_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(517931776)))]; + tensor var_2283_to_fp16 = const()[name = tensor("op_2283_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(520028992)))]; + tensor v_81_cast = linear(bias = var_2283_to_fp16, weight = var_2282_to_fp16, x = var_2263_cast); + tensor var_2291 = const()[name = tensor("op_2291"), val = tensor([1, 1500, 16, -1])]; + tensor var_2292_cast = reshape(shape = var_2291, x = q_81_cast); + tensor const_208_to_fp16 = const()[name = tensor("const_208_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_83_cast = mul(x = var_2292_cast, y = const_208_to_fp16); + tensor var_2298 = const()[name = tensor("op_2298"), val = tensor([1, 1500, 16, -1])]; + tensor var_2299_cast = reshape(shape = var_2298, x = k_81_cast); + tensor const_209_to_fp16 = const()[name = tensor("const_209_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_83_cast = mul(x = var_2299_cast, y = const_209_to_fp16); + tensor var_2305 = const()[name = tensor("op_2305"), val = tensor([1, 1500, 16, -1])]; + tensor var_2306_cast = reshape(shape = var_2305, x = v_81_cast); + tensor var_2307 = const()[name = tensor("op_2307"), val = tensor([0, 2, 1, 3])]; + tensor qk_41_transpose_x_0 = const()[name = tensor("qk_41_transpose_x_0"), val = tensor(false)]; + tensor qk_41_transpose_y_0 = const()[name = tensor("qk_41_transpose_y_0"), val = tensor(false)]; + tensor transpose_88_perm_0 = const()[name = tensor("transpose_88_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_89_perm_0 = const()[name = tensor("transpose_89_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_109 = transpose(perm = transpose_89_perm_0, x = k_83_cast); + tensor transpose_110 = transpose(perm = transpose_88_perm_0, x = q_83_cast); + tensor qk_41_cast = matmul(transpose_x = qk_41_transpose_x_0, transpose_y = qk_41_transpose_y_0, x = transpose_110, y = transpose_109); + tensor var_2311_cast = softmax(axis = var_2246, x = qk_41_cast); + tensor var_2313_transpose_x_0 = const()[name = tensor("op_2313_transpose_x_0"), val = tensor(false)]; + tensor var_2313_transpose_y_0 = const()[name = tensor("op_2313_transpose_y_0"), val = tensor(false)]; + tensor transpose_111 = transpose(perm = var_2307, x = var_2306_cast); + tensor var_2313_cast = matmul(transpose_x = var_2313_transpose_x_0, transpose_y = var_2313_transpose_y_0, x = var_2311_cast, y = transpose_111); + tensor var_2314 = const()[name = tensor("op_2314"), val = tensor([0, 2, 1, 3])]; + tensor concat_20 = const()[name = tensor("concat_20"), val = tensor([1, 1500, 1024])]; + tensor transpose_108 = transpose(perm = var_2314, x = var_2313_cast); + tensor x_251_cast = reshape(shape = concat_20, x = transpose_108); + tensor var_2319_to_fp16 = const()[name = tensor("op_2319_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(520031104)))]; + tensor var_2320_to_fp16 = const()[name = tensor("op_2320_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(522128320)))]; + tensor var_2321_cast = linear(bias = var_2320_to_fp16, weight = var_2319_to_fp16, x = x_251_cast); + tensor x_253_cast = add(x = x_247_cast, y = var_2321_cast); + tensor var_2327_axes_0 = const()[name = tensor("op_2327_axes_0"), val = tensor([-1])]; + tensor blocks_20_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_20_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(522130432)))]; + tensor blocks_20_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_20_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(522132544)))]; + tensor var_2327_cast = layer_norm(axes = var_2327_axes_0, beta = blocks_20_mlp_ln_bias_to_fp16, epsilon = var_2252_to_fp16, gamma = blocks_20_mlp_ln_weight_to_fp16, x = x_253_cast); + tensor var_2336_to_fp16 = const()[name = tensor("op_2336_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(522134656)))]; + tensor var_2337_to_fp16 = const()[name = tensor("op_2337_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(530523328)))]; + tensor input_169_cast = linear(bias = var_2337_to_fp16, weight = var_2336_to_fp16, x = var_2327_cast); + tensor x_257_mode_0 = const()[name = tensor("x_257_mode_0"), val = tensor("EXACT")]; + tensor x_257_cast = gelu(mode = x_257_mode_0, x = input_169_cast); + tensor var_2342_to_fp16 = const()[name = tensor("op_2342_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(530531584)))]; + tensor var_2343_to_fp16 = const()[name = tensor("op_2343_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538920256)))]; + tensor var_2344_cast = linear(bias = var_2343_to_fp16, weight = var_2342_to_fp16, x = x_257_cast); + tensor x_259_cast = add(x = x_253_cast, y = var_2344_cast); + tensor var_2353 = const()[name = tensor("op_2353"), val = tensor(-1)]; + tensor var_2370_axes_0 = const()[name = tensor("op_2370_axes_0"), val = tensor([-1])]; + tensor blocks_21_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_21_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538922368)))]; + tensor blocks_21_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_21_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538924480)))]; + tensor var_2359_to_fp16 = const()[name = tensor("op_2359_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2370_cast = layer_norm(axes = var_2370_axes_0, beta = blocks_21_attn_ln_bias_to_fp16, epsilon = var_2359_to_fp16, gamma = blocks_21_attn_ln_weight_to_fp16, x = x_259_cast); + tensor var_2381_to_fp16 = const()[name = tensor("op_2381_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538926592)))]; + tensor var_2382_to_fp16 = const()[name = tensor("op_2382_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(541023808)))]; + tensor q_85_cast = linear(bias = var_2382_to_fp16, weight = var_2381_to_fp16, x = var_2370_cast); + tensor var_2385_to_fp16 = const()[name = tensor("op_2385_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(541025920)))]; + tensor k_85_bias_0_to_fp16 = const()[name = tensor("k_85_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(543123136)))]; + tensor k_85_cast = linear(bias = k_85_bias_0_to_fp16, weight = var_2385_to_fp16, x = var_2370_cast); + tensor var_2389_to_fp16 = const()[name = tensor("op_2389_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(543125248)))]; + tensor var_2390_to_fp16 = const()[name = tensor("op_2390_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545222464)))]; + tensor v_85_cast = linear(bias = var_2390_to_fp16, weight = var_2389_to_fp16, x = var_2370_cast); + tensor var_2398 = const()[name = tensor("op_2398"), val = tensor([1, 1500, 16, -1])]; + tensor var_2399_cast = reshape(shape = var_2398, x = q_85_cast); + tensor const_210_to_fp16 = const()[name = tensor("const_210_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_87_cast = mul(x = var_2399_cast, y = const_210_to_fp16); + tensor var_2405 = const()[name = tensor("op_2405"), val = tensor([1, 1500, 16, -1])]; + tensor var_2406_cast = reshape(shape = var_2405, x = k_85_cast); + tensor const_211_to_fp16 = const()[name = tensor("const_211_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_87_cast = mul(x = var_2406_cast, y = const_211_to_fp16); + tensor var_2412 = const()[name = tensor("op_2412"), val = tensor([1, 1500, 16, -1])]; + tensor var_2413_cast = reshape(shape = var_2412, x = v_85_cast); + tensor var_2414 = const()[name = tensor("op_2414"), val = tensor([0, 2, 1, 3])]; + tensor qk_43_transpose_x_0 = const()[name = tensor("qk_43_transpose_x_0"), val = tensor(false)]; + tensor qk_43_transpose_y_0 = const()[name = tensor("qk_43_transpose_y_0"), val = tensor(false)]; + tensor transpose_90_perm_0 = const()[name = tensor("transpose_90_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_91_perm_0 = const()[name = tensor("transpose_91_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_105 = transpose(perm = transpose_91_perm_0, x = k_87_cast); + tensor transpose_106 = transpose(perm = transpose_90_perm_0, x = q_87_cast); + tensor qk_43_cast = matmul(transpose_x = qk_43_transpose_x_0, transpose_y = qk_43_transpose_y_0, x = transpose_106, y = transpose_105); + tensor var_2418_cast = softmax(axis = var_2353, x = qk_43_cast); + tensor var_2420_transpose_x_0 = const()[name = tensor("op_2420_transpose_x_0"), val = tensor(false)]; + tensor var_2420_transpose_y_0 = const()[name = tensor("op_2420_transpose_y_0"), val = tensor(false)]; + tensor transpose_107 = transpose(perm = var_2414, x = var_2413_cast); + tensor var_2420_cast = matmul(transpose_x = var_2420_transpose_x_0, transpose_y = var_2420_transpose_y_0, x = var_2418_cast, y = transpose_107); + tensor var_2421 = const()[name = tensor("op_2421"), val = tensor([0, 2, 1, 3])]; + tensor concat_21 = const()[name = tensor("concat_21"), val = tensor([1, 1500, 1024])]; + tensor transpose_104 = transpose(perm = var_2421, x = var_2420_cast); + tensor x_263_cast = reshape(shape = concat_21, x = transpose_104); + tensor var_2426_to_fp16 = const()[name = tensor("op_2426_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545224576)))]; + tensor var_2427_to_fp16 = const()[name = tensor("op_2427_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547321792)))]; + tensor var_2428_cast = linear(bias = var_2427_to_fp16, weight = var_2426_to_fp16, x = x_263_cast); + tensor x_265_cast = add(x = x_259_cast, y = var_2428_cast); + tensor var_2434_axes_0 = const()[name = tensor("op_2434_axes_0"), val = tensor([-1])]; + tensor blocks_21_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_21_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547323904)))]; + tensor blocks_21_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_21_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547326016)))]; + tensor var_2434_cast = layer_norm(axes = var_2434_axes_0, beta = blocks_21_mlp_ln_bias_to_fp16, epsilon = var_2359_to_fp16, gamma = blocks_21_mlp_ln_weight_to_fp16, x = x_265_cast); + tensor var_2443_to_fp16 = const()[name = tensor("op_2443_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547328128)))]; + tensor var_2444_to_fp16 = const()[name = tensor("op_2444_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(555716800)))]; + tensor input_177_cast = linear(bias = var_2444_to_fp16, weight = var_2443_to_fp16, x = var_2434_cast); + tensor x_269_mode_0 = const()[name = tensor("x_269_mode_0"), val = tensor("EXACT")]; + tensor x_269_cast = gelu(mode = x_269_mode_0, x = input_177_cast); + tensor var_2449_to_fp16 = const()[name = tensor("op_2449_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(555725056)))]; + tensor var_2450_to_fp16 = const()[name = tensor("op_2450_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(564113728)))]; + tensor var_2451_cast = linear(bias = var_2450_to_fp16, weight = var_2449_to_fp16, x = x_269_cast); + tensor x_271_cast = add(x = x_265_cast, y = var_2451_cast); + tensor var_2460 = const()[name = tensor("op_2460"), val = tensor(-1)]; + tensor var_2477_axes_0 = const()[name = tensor("op_2477_axes_0"), val = tensor([-1])]; + tensor blocks_22_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_22_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(564115840)))]; + tensor blocks_22_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_22_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(564117952)))]; + tensor var_2466_to_fp16 = const()[name = tensor("op_2466_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2477_cast = layer_norm(axes = var_2477_axes_0, beta = blocks_22_attn_ln_bias_to_fp16, epsilon = var_2466_to_fp16, gamma = blocks_22_attn_ln_weight_to_fp16, x = x_271_cast); + tensor var_2488_to_fp16 = const()[name = tensor("op_2488_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(564120064)))]; + tensor var_2489_to_fp16 = const()[name = tensor("op_2489_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(566217280)))]; + tensor q_89_cast = linear(bias = var_2489_to_fp16, weight = var_2488_to_fp16, x = var_2477_cast); + tensor var_2492_to_fp16 = const()[name = tensor("op_2492_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(566219392)))]; + tensor k_89_bias_0_to_fp16 = const()[name = tensor("k_89_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568316608)))]; + tensor k_89_cast = linear(bias = k_89_bias_0_to_fp16, weight = var_2492_to_fp16, x = var_2477_cast); + tensor var_2496_to_fp16 = const()[name = tensor("op_2496_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568318720)))]; + tensor var_2497_to_fp16 = const()[name = tensor("op_2497_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570415936)))]; + tensor v_89_cast = linear(bias = var_2497_to_fp16, weight = var_2496_to_fp16, x = var_2477_cast); + tensor var_2505 = const()[name = tensor("op_2505"), val = tensor([1, 1500, 16, -1])]; + tensor var_2506_cast = reshape(shape = var_2505, x = q_89_cast); + tensor const_212_to_fp16 = const()[name = tensor("const_212_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_91_cast = mul(x = var_2506_cast, y = const_212_to_fp16); + tensor var_2512 = const()[name = tensor("op_2512"), val = tensor([1, 1500, 16, -1])]; + tensor var_2513_cast = reshape(shape = var_2512, x = k_89_cast); + tensor const_213_to_fp16 = const()[name = tensor("const_213_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_91_cast = mul(x = var_2513_cast, y = const_213_to_fp16); + tensor var_2519 = const()[name = tensor("op_2519"), val = tensor([1, 1500, 16, -1])]; + tensor var_2520_cast = reshape(shape = var_2519, x = v_89_cast); + tensor var_2521 = const()[name = tensor("op_2521"), val = tensor([0, 2, 1, 3])]; + tensor qk_45_transpose_x_0 = const()[name = tensor("qk_45_transpose_x_0"), val = tensor(false)]; + tensor qk_45_transpose_y_0 = const()[name = tensor("qk_45_transpose_y_0"), val = tensor(false)]; + tensor transpose_92_perm_0 = const()[name = tensor("transpose_92_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_93_perm_0 = const()[name = tensor("transpose_93_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_101 = transpose(perm = transpose_93_perm_0, x = k_91_cast); + tensor transpose_102 = transpose(perm = transpose_92_perm_0, x = q_91_cast); + tensor qk_45_cast = matmul(transpose_x = qk_45_transpose_x_0, transpose_y = qk_45_transpose_y_0, x = transpose_102, y = transpose_101); + tensor var_2525_cast = softmax(axis = var_2460, x = qk_45_cast); + tensor var_2527_transpose_x_0 = const()[name = tensor("op_2527_transpose_x_0"), val = tensor(false)]; + tensor var_2527_transpose_y_0 = const()[name = tensor("op_2527_transpose_y_0"), val = tensor(false)]; + tensor transpose_103 = transpose(perm = var_2521, x = var_2520_cast); + tensor var_2527_cast = matmul(transpose_x = var_2527_transpose_x_0, transpose_y = var_2527_transpose_y_0, x = var_2525_cast, y = transpose_103); + tensor var_2528 = const()[name = tensor("op_2528"), val = tensor([0, 2, 1, 3])]; + tensor concat_22 = const()[name = tensor("concat_22"), val = tensor([1, 1500, 1024])]; + tensor transpose_100 = transpose(perm = var_2528, x = var_2527_cast); + tensor x_275_cast = reshape(shape = concat_22, x = transpose_100); + tensor var_2533_to_fp16 = const()[name = tensor("op_2533_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570418048)))]; + tensor var_2534_to_fp16 = const()[name = tensor("op_2534_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572515264)))]; + tensor var_2535_cast = linear(bias = var_2534_to_fp16, weight = var_2533_to_fp16, x = x_275_cast); + tensor x_277_cast = add(x = x_271_cast, y = var_2535_cast); + tensor var_2541_axes_0 = const()[name = tensor("op_2541_axes_0"), val = tensor([-1])]; + tensor blocks_22_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_22_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572517376)))]; + tensor blocks_22_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_22_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572519488)))]; + tensor var_2541_cast = layer_norm(axes = var_2541_axes_0, beta = blocks_22_mlp_ln_bias_to_fp16, epsilon = var_2466_to_fp16, gamma = blocks_22_mlp_ln_weight_to_fp16, x = x_277_cast); + tensor var_2550_to_fp16 = const()[name = tensor("op_2550_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572521600)))]; + tensor var_2551_to_fp16 = const()[name = tensor("op_2551_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(580910272)))]; + tensor input_185_cast = linear(bias = var_2551_to_fp16, weight = var_2550_to_fp16, x = var_2541_cast); + tensor x_281_mode_0 = const()[name = tensor("x_281_mode_0"), val = tensor("EXACT")]; + tensor x_281_cast = gelu(mode = x_281_mode_0, x = input_185_cast); + tensor var_2556_to_fp16 = const()[name = tensor("op_2556_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(580918528)))]; + tensor var_2557_to_fp16 = const()[name = tensor("op_2557_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589307200)))]; + tensor var_2558_cast = linear(bias = var_2557_to_fp16, weight = var_2556_to_fp16, x = x_281_cast); + tensor x_283_cast = add(x = x_277_cast, y = var_2558_cast); + tensor var_2567 = const()[name = tensor("op_2567"), val = tensor(-1)]; + tensor var_2584_axes_0 = const()[name = tensor("op_2584_axes_0"), val = tensor([-1])]; + tensor blocks_23_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_23_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589309312)))]; + tensor blocks_23_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_23_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589311424)))]; + tensor var_2573_to_fp16 = const()[name = tensor("op_2573_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2584_cast = layer_norm(axes = var_2584_axes_0, beta = blocks_23_attn_ln_bias_to_fp16, epsilon = var_2573_to_fp16, gamma = blocks_23_attn_ln_weight_to_fp16, x = x_283_cast); + tensor var_2595_to_fp16 = const()[name = tensor("op_2595_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589313536)))]; + tensor var_2596_to_fp16 = const()[name = tensor("op_2596_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(591410752)))]; + tensor q_93_cast = linear(bias = var_2596_to_fp16, weight = var_2595_to_fp16, x = var_2584_cast); + tensor var_2599_to_fp16 = const()[name = tensor("op_2599_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(591412864)))]; + tensor k_93_bias_0_to_fp16 = const()[name = tensor("k_93_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(593510080)))]; + tensor k_93_cast = linear(bias = k_93_bias_0_to_fp16, weight = var_2599_to_fp16, x = var_2584_cast); + tensor var_2603_to_fp16 = const()[name = tensor("op_2603_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(593512192)))]; + tensor var_2604_to_fp16 = const()[name = tensor("op_2604_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(595609408)))]; + tensor v_93_cast = linear(bias = var_2604_to_fp16, weight = var_2603_to_fp16, x = var_2584_cast); + tensor var_2612 = const()[name = tensor("op_2612"), val = tensor([1, 1500, 16, -1])]; + tensor var_2613_cast = reshape(shape = var_2612, x = q_93_cast); + tensor const_214_to_fp16 = const()[name = tensor("const_214_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor q_cast = mul(x = var_2613_cast, y = const_214_to_fp16); + tensor var_2619 = const()[name = tensor("op_2619"), val = tensor([1, 1500, 16, -1])]; + tensor var_2620_cast = reshape(shape = var_2619, x = k_93_cast); + tensor const_215_to_fp16 = const()[name = tensor("const_215_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; + tensor k_cast = mul(x = var_2620_cast, y = const_215_to_fp16); + tensor var_2626 = const()[name = tensor("op_2626"), val = tensor([1, 1500, 16, -1])]; + tensor var_2627_cast = reshape(shape = var_2626, x = v_93_cast); + tensor var_2628 = const()[name = tensor("op_2628"), val = tensor([0, 2, 1, 3])]; + tensor qk_transpose_x_0 = const()[name = tensor("qk_transpose_x_0"), val = tensor(false)]; + tensor qk_transpose_y_0 = const()[name = tensor("qk_transpose_y_0"), val = tensor(false)]; + tensor transpose_94_perm_0 = const()[name = tensor("transpose_94_perm_0"), val = tensor([0, 2, 1, 3])]; + tensor transpose_95_perm_0 = const()[name = tensor("transpose_95_perm_0"), val = tensor([0, 2, 3, 1])]; + tensor transpose_97 = transpose(perm = transpose_95_perm_0, x = k_cast); + tensor transpose_98 = transpose(perm = transpose_94_perm_0, x = q_cast); + tensor qk_cast = matmul(transpose_x = qk_transpose_x_0, transpose_y = qk_transpose_y_0, x = transpose_98, y = transpose_97); + tensor var_2632_cast = softmax(axis = var_2567, x = qk_cast); + tensor var_2634_transpose_x_0 = const()[name = tensor("op_2634_transpose_x_0"), val = tensor(false)]; + tensor var_2634_transpose_y_0 = const()[name = tensor("op_2634_transpose_y_0"), val = tensor(false)]; + tensor transpose_99 = transpose(perm = var_2628, x = var_2627_cast); + tensor var_2634_cast = matmul(transpose_x = var_2634_transpose_x_0, transpose_y = var_2634_transpose_y_0, x = var_2632_cast, y = transpose_99); + tensor var_2635 = const()[name = tensor("op_2635"), val = tensor([0, 2, 1, 3])]; + tensor concat_23 = const()[name = tensor("concat_23"), val = tensor([1, 1500, 1024])]; + tensor transpose_96 = transpose(perm = var_2635, x = var_2634_cast); + tensor x_287_cast = reshape(shape = concat_23, x = transpose_96); + tensor var_2640_to_fp16 = const()[name = tensor("op_2640_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(595611520)))]; + tensor var_2641_to_fp16 = const()[name = tensor("op_2641_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(597708736)))]; + tensor var_2642_cast = linear(bias = var_2641_to_fp16, weight = var_2640_to_fp16, x = x_287_cast); + tensor x_289_cast = add(x = x_283_cast, y = var_2642_cast); + tensor var_2648_axes_0 = const()[name = tensor("op_2648_axes_0"), val = tensor([-1])]; + tensor blocks_23_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_23_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(597710848)))]; + tensor blocks_23_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_23_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(597712960)))]; + tensor var_2648_cast = layer_norm(axes = var_2648_axes_0, beta = blocks_23_mlp_ln_bias_to_fp16, epsilon = var_2573_to_fp16, gamma = blocks_23_mlp_ln_weight_to_fp16, x = x_289_cast); + tensor var_2657_to_fp16 = const()[name = tensor("op_2657_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(597715072)))]; + tensor var_2658_to_fp16 = const()[name = tensor("op_2658_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(606103744)))]; + tensor input_193_cast = linear(bias = var_2658_to_fp16, weight = var_2657_to_fp16, x = var_2648_cast); + tensor x_293_mode_0 = const()[name = tensor("x_293_mode_0"), val = tensor("EXACT")]; + tensor x_293_cast = gelu(mode = x_293_mode_0, x = input_193_cast); + tensor var_2663_to_fp16 = const()[name = tensor("op_2663_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(606112000)))]; + tensor var_2664_to_fp16 = const()[name = tensor("op_2664_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614500672)))]; + tensor var_2665_cast = linear(bias = var_2664_to_fp16, weight = var_2663_to_fp16, x = x_293_cast); + tensor x_cast = add(x = x_289_cast, y = var_2665_cast); + tensor var_2678_axes_0 = const()[name = tensor("op_2678_axes_0"), val = tensor([-1])]; + tensor ln_post_weight_to_fp16 = const()[name = tensor("ln_post_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614502784)))]; + tensor ln_post_bias_to_fp16 = const()[name = tensor("ln_post_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614504896)))]; + tensor var_2669_to_fp16 = const()[name = tensor("op_2669_to_fp16"), val = tensor(0x1.5p-17)]; + tensor var_2678_cast = layer_norm(axes = var_2678_axes_0, beta = ln_post_bias_to_fp16, epsilon = var_2669_to_fp16, gamma = ln_post_weight_to_fp16, x = x_cast); + tensor var_2678_cast_to_fp32_dtype_0 = const()[name = tensor("op_2678_cast_to_fp32_dtype_0"), val = tensor("fp32")]; + tensor output = cast(dtype = var_2678_cast_to_fp32_dtype_0, x = var_2678_cast); + } -> (output); +} \ No newline at end of file