program(1.0) [buildInfo = dict, tensor>({{"coremlc-component-MIL", "4.28.4"}, {"coremlc-version", "1436.100.10"}})] { func main(tensor logmel_data) { tensor var_56 = const()[name = tensor("op_56"), val = tensor(1)]; tensor var_64 = const()[name = tensor("op_64"), val = tensor([1])]; tensor var_66 = const()[name = tensor("op_66"), val = tensor([1])]; tensor var_68_pad_type_0 = const()[name = tensor("op_68_pad_type_0"), val = tensor("custom")]; tensor var_68_pad_0 = const()[name = tensor("op_68_pad_0"), val = tensor([1, 1])]; tensor logmel_data_to_fp16_dtype_0 = const()[name = tensor("logmel_data_to_fp16_dtype_0"), val = tensor("fp16")]; tensor weight_3_to_fp16 = const()[name = tensor("weight_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64)))]; tensor bias_3_to_fp16 = const()[name = tensor("bias_3_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(491648)))]; tensor cast_727 = cast(dtype = logmel_data_to_fp16_dtype_0, x = logmel_data); tensor var_68_cast = conv(bias = bias_3_to_fp16, dilations = var_66, groups = var_56, pad = var_68_pad_0, pad_type = var_68_pad_type_0, strides = var_64, weight = weight_3_to_fp16, x = cast_727); tensor input_1_mode_0 = const()[name = tensor("input_1_mode_0"), val = tensor("EXACT")]; tensor input_1_cast = gelu(mode = input_1_mode_0, x = var_68_cast); tensor var_72 = const()[name = tensor("op_72"), val = tensor(1)]; tensor var_81 = const()[name = tensor("op_81"), val = tensor([2])]; tensor var_83 = const()[name = tensor("op_83"), val = tensor([1])]; tensor var_85_pad_type_0 = const()[name = tensor("op_85_pad_type_0"), val = tensor("custom")]; tensor var_85_pad_0 = const()[name = tensor("op_85_pad_0"), val = tensor([1, 1])]; tensor weight_7_to_fp16 = const()[name = tensor("weight_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(493760)))]; tensor bias_7_to_fp16 = const()[name = tensor("bias_7_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6785280)))]; tensor var_85_cast = conv(bias = bias_7_to_fp16, dilations = var_83, groups = var_72, pad = var_85_pad_0, pad_type = var_85_pad_type_0, strides = var_81, weight = weight_7_to_fp16, x = input_1_cast); tensor x_3_mode_0 = const()[name = tensor("x_3_mode_0"), val = tensor("EXACT")]; tensor x_3_cast = gelu(mode = x_3_mode_0, x = var_85_cast); tensor var_90 = const()[name = tensor("op_90"), val = tensor([0, 2, 1])]; tensor positional_embedding_to_fp16 = const()[name = tensor("positional_embedding_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(6787392)))]; tensor transpose_192 = transpose(perm = var_90, x = x_3_cast); tensor var_93_cast = add(x = transpose_192, y = positional_embedding_to_fp16); tensor var_106 = const()[name = tensor("op_106"), val = tensor(-1)]; tensor var_123_axes_0 = const()[name = tensor("op_123_axes_0"), val = tensor([-1])]; tensor blocks_0_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_0_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9859456)))]; tensor blocks_0_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_0_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9861568)))]; tensor var_112_to_fp16 = const()[name = tensor("op_112_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_123_cast = layer_norm(axes = var_123_axes_0, beta = blocks_0_attn_ln_bias_to_fp16, epsilon = var_112_to_fp16, gamma = blocks_0_attn_ln_weight_to_fp16, x = var_93_cast); tensor var_134_to_fp16 = const()[name = tensor("op_134_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(9863680)))]; tensor var_135_to_fp16 = const()[name = tensor("op_135_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11960896)))]; tensor q_1_cast = linear(bias = var_135_to_fp16, weight = var_134_to_fp16, x = var_123_cast); tensor var_138_to_fp16 = const()[name = tensor("op_138_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(11963008)))]; tensor k_1_bias_0_to_fp16 = const()[name = tensor("k_1_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14060224)))]; tensor k_1_cast = linear(bias = k_1_bias_0_to_fp16, weight = var_138_to_fp16, x = var_123_cast); tensor var_142_to_fp16 = const()[name = tensor("op_142_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(14062336)))]; tensor var_143_to_fp16 = const()[name = tensor("op_143_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16159552)))]; tensor v_1_cast = linear(bias = var_143_to_fp16, weight = var_142_to_fp16, x = var_123_cast); tensor var_151 = const()[name = tensor("op_151"), val = tensor([1, 1500, 16, -1])]; tensor var_152_cast = reshape(shape = var_151, x = q_1_cast); tensor const_168_to_fp16 = const()[name = tensor("const_168_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_3_cast = mul(x = var_152_cast, y = const_168_to_fp16); tensor var_158 = const()[name = tensor("op_158"), val = tensor([1, 1500, 16, -1])]; tensor var_159_cast = reshape(shape = var_158, x = k_1_cast); tensor const_169_to_fp16 = const()[name = tensor("const_169_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_3_cast = mul(x = var_159_cast, y = const_169_to_fp16); tensor var_165 = const()[name = tensor("op_165"), val = tensor([1, 1500, 16, -1])]; tensor var_166_cast = reshape(shape = var_165, x = v_1_cast); tensor var_167 = const()[name = tensor("op_167"), val = tensor([0, 2, 1, 3])]; tensor qk_1_transpose_x_0 = const()[name = tensor("qk_1_transpose_x_0"), val = tensor(false)]; tensor qk_1_transpose_y_0 = const()[name = tensor("qk_1_transpose_y_0"), val = tensor(false)]; tensor transpose_48_perm_0 = const()[name = tensor("transpose_48_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_49_perm_0 = const()[name = tensor("transpose_49_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_189 = transpose(perm = transpose_49_perm_0, x = k_3_cast); tensor transpose_190 = transpose(perm = transpose_48_perm_0, x = q_3_cast); tensor qk_1_cast = matmul(transpose_x = qk_1_transpose_x_0, transpose_y = qk_1_transpose_y_0, x = transpose_190, y = transpose_189); tensor var_171_cast = softmax(axis = var_106, x = qk_1_cast); tensor var_173_transpose_x_0 = const()[name = tensor("op_173_transpose_x_0"), val = tensor(false)]; tensor var_173_transpose_y_0 = const()[name = tensor("op_173_transpose_y_0"), val = tensor(false)]; tensor transpose_191 = transpose(perm = var_167, x = var_166_cast); tensor var_173_cast = matmul(transpose_x = var_173_transpose_x_0, transpose_y = var_173_transpose_y_0, x = var_171_cast, y = transpose_191); tensor var_174 = const()[name = tensor("op_174"), val = tensor([0, 2, 1, 3])]; tensor concat_0 = const()[name = tensor("concat_0"), val = tensor([1, 1500, 1024])]; tensor transpose_188 = transpose(perm = var_174, x = var_173_cast); tensor x_11_cast = reshape(shape = concat_0, x = transpose_188); tensor var_179_to_fp16 = const()[name = tensor("op_179_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(16161664)))]; tensor var_180_to_fp16 = const()[name = tensor("op_180_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18258880)))]; tensor var_181_cast = linear(bias = var_180_to_fp16, weight = var_179_to_fp16, x = x_11_cast); tensor x_13_cast = add(x = var_93_cast, y = var_181_cast); tensor var_187_axes_0 = const()[name = tensor("op_187_axes_0"), val = tensor([-1])]; tensor blocks_0_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18260992)))]; tensor blocks_0_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_0_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18263104)))]; tensor var_187_cast = layer_norm(axes = var_187_axes_0, beta = blocks_0_mlp_ln_bias_to_fp16, epsilon = var_112_to_fp16, gamma = blocks_0_mlp_ln_weight_to_fp16, x = x_13_cast); tensor var_196_to_fp16 = const()[name = tensor("op_196_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(18265216)))]; tensor var_197_to_fp16 = const()[name = tensor("op_197_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26653888)))]; tensor input_9_cast = linear(bias = var_197_to_fp16, weight = var_196_to_fp16, x = var_187_cast); tensor x_17_mode_0 = const()[name = tensor("x_17_mode_0"), val = tensor("EXACT")]; tensor x_17_cast = gelu(mode = x_17_mode_0, x = input_9_cast); tensor var_202_to_fp16 = const()[name = tensor("op_202_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(26662144)))]; tensor var_203_to_fp16 = const()[name = tensor("op_203_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35050816)))]; tensor var_204_cast = linear(bias = var_203_to_fp16, weight = var_202_to_fp16, x = x_17_cast); tensor x_19_cast = add(x = x_13_cast, y = var_204_cast); tensor var_213 = const()[name = tensor("op_213"), val = tensor(-1)]; tensor var_230_axes_0 = const()[name = tensor("op_230_axes_0"), val = tensor([-1])]; tensor blocks_1_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_1_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35052928)))]; tensor blocks_1_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_1_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35055040)))]; tensor var_219_to_fp16 = const()[name = tensor("op_219_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_230_cast = layer_norm(axes = var_230_axes_0, beta = blocks_1_attn_ln_bias_to_fp16, epsilon = var_219_to_fp16, gamma = blocks_1_attn_ln_weight_to_fp16, x = x_19_cast); tensor var_241_to_fp16 = const()[name = tensor("op_241_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(35057152)))]; tensor var_242_to_fp16 = const()[name = tensor("op_242_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37154368)))]; tensor q_5_cast = linear(bias = var_242_to_fp16, weight = var_241_to_fp16, x = var_230_cast); tensor var_245_to_fp16 = const()[name = tensor("op_245_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(37156480)))]; tensor k_5_bias_0_to_fp16 = const()[name = tensor("k_5_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39253696)))]; tensor k_5_cast = linear(bias = k_5_bias_0_to_fp16, weight = var_245_to_fp16, x = var_230_cast); tensor var_249_to_fp16 = const()[name = tensor("op_249_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(39255808)))]; tensor var_250_to_fp16 = const()[name = tensor("op_250_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41353024)))]; tensor v_5_cast = linear(bias = var_250_to_fp16, weight = var_249_to_fp16, x = var_230_cast); tensor var_258 = const()[name = tensor("op_258"), val = tensor([1, 1500, 16, -1])]; tensor var_259_cast = reshape(shape = var_258, x = q_5_cast); tensor const_170_to_fp16 = const()[name = tensor("const_170_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_7_cast = mul(x = var_259_cast, y = const_170_to_fp16); tensor var_265 = const()[name = tensor("op_265"), val = tensor([1, 1500, 16, -1])]; tensor var_266_cast = reshape(shape = var_265, x = k_5_cast); tensor const_171_to_fp16 = const()[name = tensor("const_171_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_7_cast = mul(x = var_266_cast, y = const_171_to_fp16); tensor var_272 = const()[name = tensor("op_272"), val = tensor([1, 1500, 16, -1])]; tensor var_273_cast = reshape(shape = var_272, x = v_5_cast); tensor var_274 = const()[name = tensor("op_274"), val = tensor([0, 2, 1, 3])]; tensor qk_3_transpose_x_0 = const()[name = tensor("qk_3_transpose_x_0"), val = tensor(false)]; tensor qk_3_transpose_y_0 = const()[name = tensor("qk_3_transpose_y_0"), val = tensor(false)]; tensor transpose_50_perm_0 = const()[name = tensor("transpose_50_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_51_perm_0 = const()[name = tensor("transpose_51_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_185 = transpose(perm = transpose_51_perm_0, x = k_7_cast); tensor transpose_186 = transpose(perm = transpose_50_perm_0, x = q_7_cast); tensor qk_3_cast = matmul(transpose_x = qk_3_transpose_x_0, transpose_y = qk_3_transpose_y_0, x = transpose_186, y = transpose_185); tensor var_278_cast = softmax(axis = var_213, x = qk_3_cast); tensor var_280_transpose_x_0 = const()[name = tensor("op_280_transpose_x_0"), val = tensor(false)]; tensor var_280_transpose_y_0 = const()[name = tensor("op_280_transpose_y_0"), val = tensor(false)]; tensor transpose_187 = transpose(perm = var_274, x = var_273_cast); tensor var_280_cast = matmul(transpose_x = var_280_transpose_x_0, transpose_y = var_280_transpose_y_0, x = var_278_cast, y = transpose_187); tensor var_281 = const()[name = tensor("op_281"), val = tensor([0, 2, 1, 3])]; tensor concat_1 = const()[name = tensor("concat_1"), val = tensor([1, 1500, 1024])]; tensor transpose_184 = transpose(perm = var_281, x = var_280_cast); tensor x_23_cast = reshape(shape = concat_1, x = transpose_184); tensor var_286_to_fp16 = const()[name = tensor("op_286_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(41355136)))]; tensor var_287_to_fp16 = const()[name = tensor("op_287_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43452352)))]; tensor var_288_cast = linear(bias = var_287_to_fp16, weight = var_286_to_fp16, x = x_23_cast); tensor x_25_cast = add(x = x_19_cast, y = var_288_cast); tensor var_294_axes_0 = const()[name = tensor("op_294_axes_0"), val = tensor([-1])]; tensor blocks_1_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43454464)))]; tensor blocks_1_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_1_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43456576)))]; tensor var_294_cast = layer_norm(axes = var_294_axes_0, beta = blocks_1_mlp_ln_bias_to_fp16, epsilon = var_219_to_fp16, gamma = blocks_1_mlp_ln_weight_to_fp16, x = x_25_cast); tensor var_303_to_fp16 = const()[name = tensor("op_303_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(43458688)))]; tensor var_304_to_fp16 = const()[name = tensor("op_304_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51847360)))]; tensor input_17_cast = linear(bias = var_304_to_fp16, weight = var_303_to_fp16, x = var_294_cast); tensor x_29_mode_0 = const()[name = tensor("x_29_mode_0"), val = tensor("EXACT")]; tensor x_29_cast = gelu(mode = x_29_mode_0, x = input_17_cast); tensor var_309_to_fp16 = const()[name = tensor("op_309_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(51855616)))]; tensor var_310_to_fp16 = const()[name = tensor("op_310_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60244288)))]; tensor var_311_cast = linear(bias = var_310_to_fp16, weight = var_309_to_fp16, x = x_29_cast); tensor x_31_cast = add(x = x_25_cast, y = var_311_cast); tensor var_320 = const()[name = tensor("op_320"), val = tensor(-1)]; tensor var_337_axes_0 = const()[name = tensor("op_337_axes_0"), val = tensor([-1])]; tensor blocks_2_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_2_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60246400)))]; tensor blocks_2_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_2_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60248512)))]; tensor var_326_to_fp16 = const()[name = tensor("op_326_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_337_cast = layer_norm(axes = var_337_axes_0, beta = blocks_2_attn_ln_bias_to_fp16, epsilon = var_326_to_fp16, gamma = blocks_2_attn_ln_weight_to_fp16, x = x_31_cast); tensor var_348_to_fp16 = const()[name = tensor("op_348_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(60250624)))]; tensor var_349_to_fp16 = const()[name = tensor("op_349_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(62347840)))]; tensor q_9_cast = linear(bias = var_349_to_fp16, weight = var_348_to_fp16, x = var_337_cast); tensor var_352_to_fp16 = const()[name = tensor("op_352_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(62349952)))]; tensor k_9_bias_0_to_fp16 = const()[name = tensor("k_9_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64447168)))]; tensor k_9_cast = linear(bias = k_9_bias_0_to_fp16, weight = var_352_to_fp16, x = var_337_cast); tensor var_356_to_fp16 = const()[name = tensor("op_356_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(64449280)))]; tensor var_357_to_fp16 = const()[name = tensor("op_357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66546496)))]; tensor v_9_cast = linear(bias = var_357_to_fp16, weight = var_356_to_fp16, x = var_337_cast); tensor var_365 = const()[name = tensor("op_365"), val = tensor([1, 1500, 16, -1])]; tensor var_366_cast = reshape(shape = var_365, x = q_9_cast); tensor const_172_to_fp16 = const()[name = tensor("const_172_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_11_cast = mul(x = var_366_cast, y = const_172_to_fp16); tensor var_372 = const()[name = tensor("op_372"), val = tensor([1, 1500, 16, -1])]; tensor var_373_cast = reshape(shape = var_372, x = k_9_cast); tensor const_173_to_fp16 = const()[name = tensor("const_173_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_11_cast = mul(x = var_373_cast, y = const_173_to_fp16); tensor var_379 = const()[name = tensor("op_379"), val = tensor([1, 1500, 16, -1])]; tensor var_380_cast = reshape(shape = var_379, x = v_9_cast); tensor var_381 = const()[name = tensor("op_381"), val = tensor([0, 2, 1, 3])]; tensor qk_5_transpose_x_0 = const()[name = tensor("qk_5_transpose_x_0"), val = tensor(false)]; tensor qk_5_transpose_y_0 = const()[name = tensor("qk_5_transpose_y_0"), val = tensor(false)]; tensor transpose_52_perm_0 = const()[name = tensor("transpose_52_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_53_perm_0 = const()[name = tensor("transpose_53_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_181 = transpose(perm = transpose_53_perm_0, x = k_11_cast); tensor transpose_182 = transpose(perm = transpose_52_perm_0, x = q_11_cast); tensor qk_5_cast = matmul(transpose_x = qk_5_transpose_x_0, transpose_y = qk_5_transpose_y_0, x = transpose_182, y = transpose_181); tensor var_385_cast = softmax(axis = var_320, x = qk_5_cast); tensor var_387_transpose_x_0 = const()[name = tensor("op_387_transpose_x_0"), val = tensor(false)]; tensor var_387_transpose_y_0 = const()[name = tensor("op_387_transpose_y_0"), val = tensor(false)]; tensor transpose_183 = transpose(perm = var_381, x = var_380_cast); tensor var_387_cast = matmul(transpose_x = var_387_transpose_x_0, transpose_y = var_387_transpose_y_0, x = var_385_cast, y = transpose_183); tensor var_388 = const()[name = tensor("op_388"), val = tensor([0, 2, 1, 3])]; tensor concat_2 = const()[name = tensor("concat_2"), val = tensor([1, 1500, 1024])]; tensor transpose_180 = transpose(perm = var_388, x = var_387_cast); tensor x_35_cast = reshape(shape = concat_2, x = transpose_180); tensor var_393_to_fp16 = const()[name = tensor("op_393_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(66548608)))]; tensor var_394_to_fp16 = const()[name = tensor("op_394_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68645824)))]; tensor var_395_cast = linear(bias = var_394_to_fp16, weight = var_393_to_fp16, x = x_35_cast); tensor x_37_cast = add(x = x_31_cast, y = var_395_cast); tensor var_401_axes_0 = const()[name = tensor("op_401_axes_0"), val = tensor([-1])]; tensor blocks_2_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68647936)))]; tensor blocks_2_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_2_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68650048)))]; tensor var_401_cast = layer_norm(axes = var_401_axes_0, beta = blocks_2_mlp_ln_bias_to_fp16, epsilon = var_326_to_fp16, gamma = blocks_2_mlp_ln_weight_to_fp16, x = x_37_cast); tensor var_410_to_fp16 = const()[name = tensor("op_410_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(68652160)))]; tensor var_411_to_fp16 = const()[name = tensor("op_411_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77040832)))]; tensor input_25_cast = linear(bias = var_411_to_fp16, weight = var_410_to_fp16, x = var_401_cast); tensor x_41_mode_0 = const()[name = tensor("x_41_mode_0"), val = tensor("EXACT")]; tensor x_41_cast = gelu(mode = x_41_mode_0, x = input_25_cast); tensor var_416_to_fp16 = const()[name = tensor("op_416_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(77049088)))]; tensor var_417_to_fp16 = const()[name = tensor("op_417_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85437760)))]; tensor var_418_cast = linear(bias = var_417_to_fp16, weight = var_416_to_fp16, x = x_41_cast); tensor x_43_cast = add(x = x_37_cast, y = var_418_cast); tensor var_427 = const()[name = tensor("op_427"), val = tensor(-1)]; tensor var_444_axes_0 = const()[name = tensor("op_444_axes_0"), val = tensor([-1])]; tensor blocks_3_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_3_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85439872)))]; tensor blocks_3_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_3_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85441984)))]; tensor var_433_to_fp16 = const()[name = tensor("op_433_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_444_cast = layer_norm(axes = var_444_axes_0, beta = blocks_3_attn_ln_bias_to_fp16, epsilon = var_433_to_fp16, gamma = blocks_3_attn_ln_weight_to_fp16, x = x_43_cast); tensor var_455_to_fp16 = const()[name = tensor("op_455_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(85444096)))]; tensor var_456_to_fp16 = const()[name = tensor("op_456_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(87541312)))]; tensor q_13_cast = linear(bias = var_456_to_fp16, weight = var_455_to_fp16, x = var_444_cast); tensor var_459_to_fp16 = const()[name = tensor("op_459_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(87543424)))]; tensor k_13_bias_0_to_fp16 = const()[name = tensor("k_13_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89640640)))]; tensor k_13_cast = linear(bias = k_13_bias_0_to_fp16, weight = var_459_to_fp16, x = var_444_cast); tensor var_463_to_fp16 = const()[name = tensor("op_463_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(89642752)))]; tensor var_464_to_fp16 = const()[name = tensor("op_464_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91739968)))]; tensor v_13_cast = linear(bias = var_464_to_fp16, weight = var_463_to_fp16, x = var_444_cast); tensor var_472 = const()[name = tensor("op_472"), val = tensor([1, 1500, 16, -1])]; tensor var_473_cast = reshape(shape = var_472, x = q_13_cast); tensor const_174_to_fp16 = const()[name = tensor("const_174_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_15_cast = mul(x = var_473_cast, y = const_174_to_fp16); tensor var_479 = const()[name = tensor("op_479"), val = tensor([1, 1500, 16, -1])]; tensor var_480_cast = reshape(shape = var_479, x = k_13_cast); tensor const_175_to_fp16 = const()[name = tensor("const_175_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_15_cast = mul(x = var_480_cast, y = const_175_to_fp16); tensor var_486 = const()[name = tensor("op_486"), val = tensor([1, 1500, 16, -1])]; tensor var_487_cast = reshape(shape = var_486, x = v_13_cast); tensor var_488 = const()[name = tensor("op_488"), val = tensor([0, 2, 1, 3])]; tensor qk_7_transpose_x_0 = const()[name = tensor("qk_7_transpose_x_0"), val = tensor(false)]; tensor qk_7_transpose_y_0 = const()[name = tensor("qk_7_transpose_y_0"), val = tensor(false)]; tensor transpose_54_perm_0 = const()[name = tensor("transpose_54_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_55_perm_0 = const()[name = tensor("transpose_55_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_177 = transpose(perm = transpose_55_perm_0, x = k_15_cast); tensor transpose_178 = transpose(perm = transpose_54_perm_0, x = q_15_cast); tensor qk_7_cast = matmul(transpose_x = qk_7_transpose_x_0, transpose_y = qk_7_transpose_y_0, x = transpose_178, y = transpose_177); tensor var_492_cast = softmax(axis = var_427, x = qk_7_cast); tensor var_494_transpose_x_0 = const()[name = tensor("op_494_transpose_x_0"), val = tensor(false)]; tensor var_494_transpose_y_0 = const()[name = tensor("op_494_transpose_y_0"), val = tensor(false)]; tensor transpose_179 = transpose(perm = var_488, x = var_487_cast); tensor var_494_cast = matmul(transpose_x = var_494_transpose_x_0, transpose_y = var_494_transpose_y_0, x = var_492_cast, y = transpose_179); tensor var_495 = const()[name = tensor("op_495"), val = tensor([0, 2, 1, 3])]; tensor concat_3 = const()[name = tensor("concat_3"), val = tensor([1, 1500, 1024])]; tensor transpose_176 = transpose(perm = var_495, x = var_494_cast); tensor x_47_cast = reshape(shape = concat_3, x = transpose_176); tensor var_500_to_fp16 = const()[name = tensor("op_500_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(91742080)))]; tensor var_501_to_fp16 = const()[name = tensor("op_501_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93839296)))]; tensor var_502_cast = linear(bias = var_501_to_fp16, weight = var_500_to_fp16, x = x_47_cast); tensor x_49_cast = add(x = x_43_cast, y = var_502_cast); tensor var_508_axes_0 = const()[name = tensor("op_508_axes_0"), val = tensor([-1])]; tensor blocks_3_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93841408)))]; tensor blocks_3_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_3_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93843520)))]; tensor var_508_cast = layer_norm(axes = var_508_axes_0, beta = blocks_3_mlp_ln_bias_to_fp16, epsilon = var_433_to_fp16, gamma = blocks_3_mlp_ln_weight_to_fp16, x = x_49_cast); tensor var_517_to_fp16 = const()[name = tensor("op_517_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(93845632)))]; tensor var_518_to_fp16 = const()[name = tensor("op_518_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102234304)))]; tensor input_33_cast = linear(bias = var_518_to_fp16, weight = var_517_to_fp16, x = var_508_cast); tensor x_53_mode_0 = const()[name = tensor("x_53_mode_0"), val = tensor("EXACT")]; tensor x_53_cast = gelu(mode = x_53_mode_0, x = input_33_cast); tensor var_523_to_fp16 = const()[name = tensor("op_523_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(102242560)))]; tensor var_524_to_fp16 = const()[name = tensor("op_524_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110631232)))]; tensor var_525_cast = linear(bias = var_524_to_fp16, weight = var_523_to_fp16, x = x_53_cast); tensor x_55_cast = add(x = x_49_cast, y = var_525_cast); tensor var_534 = const()[name = tensor("op_534"), val = tensor(-1)]; tensor var_551_axes_0 = const()[name = tensor("op_551_axes_0"), val = tensor([-1])]; tensor blocks_4_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_4_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110633344)))]; tensor blocks_4_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_4_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110635456)))]; tensor var_540_to_fp16 = const()[name = tensor("op_540_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_551_cast = layer_norm(axes = var_551_axes_0, beta = blocks_4_attn_ln_bias_to_fp16, epsilon = var_540_to_fp16, gamma = blocks_4_attn_ln_weight_to_fp16, x = x_55_cast); tensor var_562_to_fp16 = const()[name = tensor("op_562_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(110637568)))]; tensor var_563_to_fp16 = const()[name = tensor("op_563_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(112734784)))]; tensor q_17_cast = linear(bias = var_563_to_fp16, weight = var_562_to_fp16, x = var_551_cast); tensor var_566_to_fp16 = const()[name = tensor("op_566_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(112736896)))]; tensor k_17_bias_0_to_fp16 = const()[name = tensor("k_17_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114834112)))]; tensor k_17_cast = linear(bias = k_17_bias_0_to_fp16, weight = var_566_to_fp16, x = var_551_cast); tensor var_570_to_fp16 = const()[name = tensor("op_570_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(114836224)))]; tensor var_571_to_fp16 = const()[name = tensor("op_571_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116933440)))]; tensor v_17_cast = linear(bias = var_571_to_fp16, weight = var_570_to_fp16, x = var_551_cast); tensor var_579 = const()[name = tensor("op_579"), val = tensor([1, 1500, 16, -1])]; tensor var_580_cast = reshape(shape = var_579, x = q_17_cast); tensor const_176_to_fp16 = const()[name = tensor("const_176_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_19_cast = mul(x = var_580_cast, y = const_176_to_fp16); tensor var_586 = const()[name = tensor("op_586"), val = tensor([1, 1500, 16, -1])]; tensor var_587_cast = reshape(shape = var_586, x = k_17_cast); tensor const_177_to_fp16 = const()[name = tensor("const_177_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_19_cast = mul(x = var_587_cast, y = const_177_to_fp16); tensor var_593 = const()[name = tensor("op_593"), val = tensor([1, 1500, 16, -1])]; tensor var_594_cast = reshape(shape = var_593, x = v_17_cast); tensor var_595 = const()[name = tensor("op_595"), val = tensor([0, 2, 1, 3])]; tensor qk_9_transpose_x_0 = const()[name = tensor("qk_9_transpose_x_0"), val = tensor(false)]; tensor qk_9_transpose_y_0 = const()[name = tensor("qk_9_transpose_y_0"), val = tensor(false)]; tensor transpose_56_perm_0 = const()[name = tensor("transpose_56_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_57_perm_0 = const()[name = tensor("transpose_57_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_173 = transpose(perm = transpose_57_perm_0, x = k_19_cast); tensor transpose_174 = transpose(perm = transpose_56_perm_0, x = q_19_cast); tensor qk_9_cast = matmul(transpose_x = qk_9_transpose_x_0, transpose_y = qk_9_transpose_y_0, x = transpose_174, y = transpose_173); tensor var_599_cast = softmax(axis = var_534, x = qk_9_cast); tensor var_601_transpose_x_0 = const()[name = tensor("op_601_transpose_x_0"), val = tensor(false)]; tensor var_601_transpose_y_0 = const()[name = tensor("op_601_transpose_y_0"), val = tensor(false)]; tensor transpose_175 = transpose(perm = var_595, x = var_594_cast); tensor var_601_cast = matmul(transpose_x = var_601_transpose_x_0, transpose_y = var_601_transpose_y_0, x = var_599_cast, y = transpose_175); tensor var_602 = const()[name = tensor("op_602"), val = tensor([0, 2, 1, 3])]; tensor concat_4 = const()[name = tensor("concat_4"), val = tensor([1, 1500, 1024])]; tensor transpose_172 = transpose(perm = var_602, x = var_601_cast); tensor x_59_cast = reshape(shape = concat_4, x = transpose_172); tensor var_607_to_fp16 = const()[name = tensor("op_607_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(116935552)))]; tensor var_608_to_fp16 = const()[name = tensor("op_608_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119032768)))]; tensor var_609_cast = linear(bias = var_608_to_fp16, weight = var_607_to_fp16, x = x_59_cast); tensor x_61_cast = add(x = x_55_cast, y = var_609_cast); tensor var_615_axes_0 = const()[name = tensor("op_615_axes_0"), val = tensor([-1])]; tensor blocks_4_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119034880)))]; tensor blocks_4_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_4_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119036992)))]; tensor var_615_cast = layer_norm(axes = var_615_axes_0, beta = blocks_4_mlp_ln_bias_to_fp16, epsilon = var_540_to_fp16, gamma = blocks_4_mlp_ln_weight_to_fp16, x = x_61_cast); tensor var_624_to_fp16 = const()[name = tensor("op_624_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(119039104)))]; tensor var_625_to_fp16 = const()[name = tensor("op_625_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127427776)))]; tensor input_41_cast = linear(bias = var_625_to_fp16, weight = var_624_to_fp16, x = var_615_cast); tensor x_65_mode_0 = const()[name = tensor("x_65_mode_0"), val = tensor("EXACT")]; tensor x_65_cast = gelu(mode = x_65_mode_0, x = input_41_cast); tensor var_630_to_fp16 = const()[name = tensor("op_630_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(127436032)))]; tensor var_631_to_fp16 = const()[name = tensor("op_631_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135824704)))]; tensor var_632_cast = linear(bias = var_631_to_fp16, weight = var_630_to_fp16, x = x_65_cast); tensor x_67_cast = add(x = x_61_cast, y = var_632_cast); tensor var_641 = const()[name = tensor("op_641"), val = tensor(-1)]; tensor var_658_axes_0 = const()[name = tensor("op_658_axes_0"), val = tensor([-1])]; tensor blocks_5_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_5_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135826816)))]; tensor blocks_5_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_5_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135828928)))]; tensor var_647_to_fp16 = const()[name = tensor("op_647_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_658_cast = layer_norm(axes = var_658_axes_0, beta = blocks_5_attn_ln_bias_to_fp16, epsilon = var_647_to_fp16, gamma = blocks_5_attn_ln_weight_to_fp16, x = x_67_cast); tensor var_669_to_fp16 = const()[name = tensor("op_669_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(135831040)))]; tensor var_670_to_fp16 = const()[name = tensor("op_670_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(137928256)))]; tensor q_21_cast = linear(bias = var_670_to_fp16, weight = var_669_to_fp16, x = var_658_cast); tensor var_673_to_fp16 = const()[name = tensor("op_673_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(137930368)))]; tensor k_21_bias_0_to_fp16 = const()[name = tensor("k_21_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140027584)))]; tensor k_21_cast = linear(bias = k_21_bias_0_to_fp16, weight = var_673_to_fp16, x = var_658_cast); tensor var_677_to_fp16 = const()[name = tensor("op_677_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(140029696)))]; tensor var_678_to_fp16 = const()[name = tensor("op_678_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142126912)))]; tensor v_21_cast = linear(bias = var_678_to_fp16, weight = var_677_to_fp16, x = var_658_cast); tensor var_686 = const()[name = tensor("op_686"), val = tensor([1, 1500, 16, -1])]; tensor var_687_cast = reshape(shape = var_686, x = q_21_cast); tensor const_178_to_fp16 = const()[name = tensor("const_178_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_23_cast = mul(x = var_687_cast, y = const_178_to_fp16); tensor var_693 = const()[name = tensor("op_693"), val = tensor([1, 1500, 16, -1])]; tensor var_694_cast = reshape(shape = var_693, x = k_21_cast); tensor const_179_to_fp16 = const()[name = tensor("const_179_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_23_cast = mul(x = var_694_cast, y = const_179_to_fp16); tensor var_700 = const()[name = tensor("op_700"), val = tensor([1, 1500, 16, -1])]; tensor var_701_cast = reshape(shape = var_700, x = v_21_cast); tensor var_702 = const()[name = tensor("op_702"), val = tensor([0, 2, 1, 3])]; tensor qk_11_transpose_x_0 = const()[name = tensor("qk_11_transpose_x_0"), val = tensor(false)]; tensor qk_11_transpose_y_0 = const()[name = tensor("qk_11_transpose_y_0"), val = tensor(false)]; tensor transpose_58_perm_0 = const()[name = tensor("transpose_58_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_59_perm_0 = const()[name = tensor("transpose_59_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_169 = transpose(perm = transpose_59_perm_0, x = k_23_cast); tensor transpose_170 = transpose(perm = transpose_58_perm_0, x = q_23_cast); tensor qk_11_cast = matmul(transpose_x = qk_11_transpose_x_0, transpose_y = qk_11_transpose_y_0, x = transpose_170, y = transpose_169); tensor var_706_cast = softmax(axis = var_641, x = qk_11_cast); tensor var_708_transpose_x_0 = const()[name = tensor("op_708_transpose_x_0"), val = tensor(false)]; tensor var_708_transpose_y_0 = const()[name = tensor("op_708_transpose_y_0"), val = tensor(false)]; tensor transpose_171 = transpose(perm = var_702, x = var_701_cast); tensor var_708_cast = matmul(transpose_x = var_708_transpose_x_0, transpose_y = var_708_transpose_y_0, x = var_706_cast, y = transpose_171); tensor var_709 = const()[name = tensor("op_709"), val = tensor([0, 2, 1, 3])]; tensor concat_5 = const()[name = tensor("concat_5"), val = tensor([1, 1500, 1024])]; tensor transpose_168 = transpose(perm = var_709, x = var_708_cast); tensor x_71_cast = reshape(shape = concat_5, x = transpose_168); tensor var_714_to_fp16 = const()[name = tensor("op_714_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(142129024)))]; tensor var_715_to_fp16 = const()[name = tensor("op_715_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144226240)))]; tensor var_716_cast = linear(bias = var_715_to_fp16, weight = var_714_to_fp16, x = x_71_cast); tensor x_73_cast = add(x = x_67_cast, y = var_716_cast); tensor var_722_axes_0 = const()[name = tensor("op_722_axes_0"), val = tensor([-1])]; tensor blocks_5_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144228352)))]; tensor blocks_5_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_5_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144230464)))]; tensor var_722_cast = layer_norm(axes = var_722_axes_0, beta = blocks_5_mlp_ln_bias_to_fp16, epsilon = var_647_to_fp16, gamma = blocks_5_mlp_ln_weight_to_fp16, x = x_73_cast); tensor var_731_to_fp16 = const()[name = tensor("op_731_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(144232576)))]; tensor var_732_to_fp16 = const()[name = tensor("op_732_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(152621248)))]; tensor input_49_cast = linear(bias = var_732_to_fp16, weight = var_731_to_fp16, x = var_722_cast); tensor x_77_mode_0 = const()[name = tensor("x_77_mode_0"), val = tensor("EXACT")]; tensor x_77_cast = gelu(mode = x_77_mode_0, x = input_49_cast); tensor var_737_to_fp16 = const()[name = tensor("op_737_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(152629504)))]; tensor var_738_to_fp16 = const()[name = tensor("op_738_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(161018176)))]; tensor var_739_cast = linear(bias = var_738_to_fp16, weight = var_737_to_fp16, x = x_77_cast); tensor x_79_cast = add(x = x_73_cast, y = var_739_cast); tensor var_748 = const()[name = tensor("op_748"), val = tensor(-1)]; tensor var_765_axes_0 = const()[name = tensor("op_765_axes_0"), val = tensor([-1])]; tensor blocks_6_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_6_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(161020288)))]; tensor blocks_6_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_6_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(161022400)))]; tensor var_754_to_fp16 = const()[name = tensor("op_754_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_765_cast = layer_norm(axes = var_765_axes_0, beta = blocks_6_attn_ln_bias_to_fp16, epsilon = var_754_to_fp16, gamma = blocks_6_attn_ln_weight_to_fp16, x = x_79_cast); tensor var_776_to_fp16 = const()[name = tensor("op_776_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(161024512)))]; tensor var_777_to_fp16 = const()[name = tensor("op_777_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163121728)))]; tensor q_25_cast = linear(bias = var_777_to_fp16, weight = var_776_to_fp16, x = var_765_cast); tensor var_780_to_fp16 = const()[name = tensor("op_780_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(163123840)))]; tensor k_25_bias_0_to_fp16 = const()[name = tensor("k_25_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165221056)))]; tensor k_25_cast = linear(bias = k_25_bias_0_to_fp16, weight = var_780_to_fp16, x = var_765_cast); tensor var_784_to_fp16 = const()[name = tensor("op_784_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(165223168)))]; tensor var_785_to_fp16 = const()[name = tensor("op_785_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167320384)))]; tensor v_25_cast = linear(bias = var_785_to_fp16, weight = var_784_to_fp16, x = var_765_cast); tensor var_793 = const()[name = tensor("op_793"), val = tensor([1, 1500, 16, -1])]; tensor var_794_cast = reshape(shape = var_793, x = q_25_cast); tensor const_180_to_fp16 = const()[name = tensor("const_180_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_27_cast = mul(x = var_794_cast, y = const_180_to_fp16); tensor var_800 = const()[name = tensor("op_800"), val = tensor([1, 1500, 16, -1])]; tensor var_801_cast = reshape(shape = var_800, x = k_25_cast); tensor const_181_to_fp16 = const()[name = tensor("const_181_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_27_cast = mul(x = var_801_cast, y = const_181_to_fp16); tensor var_807 = const()[name = tensor("op_807"), val = tensor([1, 1500, 16, -1])]; tensor var_808_cast = reshape(shape = var_807, x = v_25_cast); tensor var_809 = const()[name = tensor("op_809"), val = tensor([0, 2, 1, 3])]; tensor qk_13_transpose_x_0 = const()[name = tensor("qk_13_transpose_x_0"), val = tensor(false)]; tensor qk_13_transpose_y_0 = const()[name = tensor("qk_13_transpose_y_0"), val = tensor(false)]; tensor transpose_60_perm_0 = const()[name = tensor("transpose_60_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_61_perm_0 = const()[name = tensor("transpose_61_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_165 = transpose(perm = transpose_61_perm_0, x = k_27_cast); tensor transpose_166 = transpose(perm = transpose_60_perm_0, x = q_27_cast); tensor qk_13_cast = matmul(transpose_x = qk_13_transpose_x_0, transpose_y = qk_13_transpose_y_0, x = transpose_166, y = transpose_165); tensor var_813_cast = softmax(axis = var_748, x = qk_13_cast); tensor var_815_transpose_x_0 = const()[name = tensor("op_815_transpose_x_0"), val = tensor(false)]; tensor var_815_transpose_y_0 = const()[name = tensor("op_815_transpose_y_0"), val = tensor(false)]; tensor transpose_167 = transpose(perm = var_809, x = var_808_cast); tensor var_815_cast = matmul(transpose_x = var_815_transpose_x_0, transpose_y = var_815_transpose_y_0, x = var_813_cast, y = transpose_167); tensor var_816 = const()[name = tensor("op_816"), val = tensor([0, 2, 1, 3])]; tensor concat_6 = const()[name = tensor("concat_6"), val = tensor([1, 1500, 1024])]; tensor transpose_164 = transpose(perm = var_816, x = var_815_cast); tensor x_83_cast = reshape(shape = concat_6, x = transpose_164); tensor var_821_to_fp16 = const()[name = tensor("op_821_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(167322496)))]; tensor var_822_to_fp16 = const()[name = tensor("op_822_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169419712)))]; tensor var_823_cast = linear(bias = var_822_to_fp16, weight = var_821_to_fp16, x = x_83_cast); tensor x_85_cast = add(x = x_79_cast, y = var_823_cast); tensor var_829_axes_0 = const()[name = tensor("op_829_axes_0"), val = tensor([-1])]; tensor blocks_6_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_6_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169421824)))]; tensor blocks_6_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_6_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169423936)))]; tensor var_829_cast = layer_norm(axes = var_829_axes_0, beta = blocks_6_mlp_ln_bias_to_fp16, epsilon = var_754_to_fp16, gamma = blocks_6_mlp_ln_weight_to_fp16, x = x_85_cast); tensor var_838_to_fp16 = const()[name = tensor("op_838_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(169426048)))]; tensor var_839_to_fp16 = const()[name = tensor("op_839_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177814720)))]; tensor input_57_cast = linear(bias = var_839_to_fp16, weight = var_838_to_fp16, x = var_829_cast); tensor x_89_mode_0 = const()[name = tensor("x_89_mode_0"), val = tensor("EXACT")]; tensor x_89_cast = gelu(mode = x_89_mode_0, x = input_57_cast); tensor var_844_to_fp16 = const()[name = tensor("op_844_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(177822976)))]; tensor var_845_to_fp16 = const()[name = tensor("op_845_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186211648)))]; tensor var_846_cast = linear(bias = var_845_to_fp16, weight = var_844_to_fp16, x = x_89_cast); tensor x_91_cast = add(x = x_85_cast, y = var_846_cast); tensor var_855 = const()[name = tensor("op_855"), val = tensor(-1)]; tensor var_872_axes_0 = const()[name = tensor("op_872_axes_0"), val = tensor([-1])]; tensor blocks_7_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_7_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186213760)))]; tensor blocks_7_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_7_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186215872)))]; tensor var_861_to_fp16 = const()[name = tensor("op_861_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_872_cast = layer_norm(axes = var_872_axes_0, beta = blocks_7_attn_ln_bias_to_fp16, epsilon = var_861_to_fp16, gamma = blocks_7_attn_ln_weight_to_fp16, x = x_91_cast); tensor var_883_to_fp16 = const()[name = tensor("op_883_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(186217984)))]; tensor var_884_to_fp16 = const()[name = tensor("op_884_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(188315200)))]; tensor q_29_cast = linear(bias = var_884_to_fp16, weight = var_883_to_fp16, x = var_872_cast); tensor var_887_to_fp16 = const()[name = tensor("op_887_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(188317312)))]; tensor k_29_bias_0_to_fp16 = const()[name = tensor("k_29_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190414528)))]; tensor k_29_cast = linear(bias = k_29_bias_0_to_fp16, weight = var_887_to_fp16, x = var_872_cast); tensor var_891_to_fp16 = const()[name = tensor("op_891_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(190416640)))]; tensor var_892_to_fp16 = const()[name = tensor("op_892_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192513856)))]; tensor v_29_cast = linear(bias = var_892_to_fp16, weight = var_891_to_fp16, x = var_872_cast); tensor var_900 = const()[name = tensor("op_900"), val = tensor([1, 1500, 16, -1])]; tensor var_901_cast = reshape(shape = var_900, x = q_29_cast); tensor const_182_to_fp16 = const()[name = tensor("const_182_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_31_cast = mul(x = var_901_cast, y = const_182_to_fp16); tensor var_907 = const()[name = tensor("op_907"), val = tensor([1, 1500, 16, -1])]; tensor var_908_cast = reshape(shape = var_907, x = k_29_cast); tensor const_183_to_fp16 = const()[name = tensor("const_183_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_31_cast = mul(x = var_908_cast, y = const_183_to_fp16); tensor var_914 = const()[name = tensor("op_914"), val = tensor([1, 1500, 16, -1])]; tensor var_915_cast = reshape(shape = var_914, x = v_29_cast); tensor var_916 = const()[name = tensor("op_916"), val = tensor([0, 2, 1, 3])]; tensor qk_15_transpose_x_0 = const()[name = tensor("qk_15_transpose_x_0"), val = tensor(false)]; tensor qk_15_transpose_y_0 = const()[name = tensor("qk_15_transpose_y_0"), val = tensor(false)]; tensor transpose_62_perm_0 = const()[name = tensor("transpose_62_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_63_perm_0 = const()[name = tensor("transpose_63_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_161 = transpose(perm = transpose_63_perm_0, x = k_31_cast); tensor transpose_162 = transpose(perm = transpose_62_perm_0, x = q_31_cast); tensor qk_15_cast = matmul(transpose_x = qk_15_transpose_x_0, transpose_y = qk_15_transpose_y_0, x = transpose_162, y = transpose_161); tensor var_920_cast = softmax(axis = var_855, x = qk_15_cast); tensor var_922_transpose_x_0 = const()[name = tensor("op_922_transpose_x_0"), val = tensor(false)]; tensor var_922_transpose_y_0 = const()[name = tensor("op_922_transpose_y_0"), val = tensor(false)]; tensor transpose_163 = transpose(perm = var_916, x = var_915_cast); tensor var_922_cast = matmul(transpose_x = var_922_transpose_x_0, transpose_y = var_922_transpose_y_0, x = var_920_cast, y = transpose_163); tensor var_923 = const()[name = tensor("op_923"), val = tensor([0, 2, 1, 3])]; tensor concat_7 = const()[name = tensor("concat_7"), val = tensor([1, 1500, 1024])]; tensor transpose_160 = transpose(perm = var_923, x = var_922_cast); tensor x_95_cast = reshape(shape = concat_7, x = transpose_160); tensor var_928_to_fp16 = const()[name = tensor("op_928_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(192515968)))]; tensor var_929_to_fp16 = const()[name = tensor("op_929_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194613184)))]; tensor var_930_cast = linear(bias = var_929_to_fp16, weight = var_928_to_fp16, x = x_95_cast); tensor x_97_cast = add(x = x_91_cast, y = var_930_cast); tensor var_936_axes_0 = const()[name = tensor("op_936_axes_0"), val = tensor([-1])]; tensor blocks_7_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_7_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194615296)))]; tensor blocks_7_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_7_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194617408)))]; tensor var_936_cast = layer_norm(axes = var_936_axes_0, beta = blocks_7_mlp_ln_bias_to_fp16, epsilon = var_861_to_fp16, gamma = blocks_7_mlp_ln_weight_to_fp16, x = x_97_cast); tensor var_945_to_fp16 = const()[name = tensor("op_945_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(194619520)))]; tensor var_946_to_fp16 = const()[name = tensor("op_946_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(203008192)))]; tensor input_65_cast = linear(bias = var_946_to_fp16, weight = var_945_to_fp16, x = var_936_cast); tensor x_101_mode_0 = const()[name = tensor("x_101_mode_0"), val = tensor("EXACT")]; tensor x_101_cast = gelu(mode = x_101_mode_0, x = input_65_cast); tensor var_951_to_fp16 = const()[name = tensor("op_951_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(203016448)))]; tensor var_952_to_fp16 = const()[name = tensor("op_952_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211405120)))]; tensor var_953_cast = linear(bias = var_952_to_fp16, weight = var_951_to_fp16, x = x_101_cast); tensor x_103_cast = add(x = x_97_cast, y = var_953_cast); tensor var_962 = const()[name = tensor("op_962"), val = tensor(-1)]; tensor var_979_axes_0 = const()[name = tensor("op_979_axes_0"), val = tensor([-1])]; tensor blocks_8_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_8_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211407232)))]; tensor blocks_8_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_8_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211409344)))]; tensor var_968_to_fp16 = const()[name = tensor("op_968_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_979_cast = layer_norm(axes = var_979_axes_0, beta = blocks_8_attn_ln_bias_to_fp16, epsilon = var_968_to_fp16, gamma = blocks_8_attn_ln_weight_to_fp16, x = x_103_cast); tensor var_990_to_fp16 = const()[name = tensor("op_990_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(211411456)))]; tensor var_991_to_fp16 = const()[name = tensor("op_991_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(213508672)))]; tensor q_33_cast = linear(bias = var_991_to_fp16, weight = var_990_to_fp16, x = var_979_cast); tensor var_994_to_fp16 = const()[name = tensor("op_994_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(213510784)))]; tensor k_33_bias_0_to_fp16 = const()[name = tensor("k_33_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215608000)))]; tensor k_33_cast = linear(bias = k_33_bias_0_to_fp16, weight = var_994_to_fp16, x = var_979_cast); tensor var_998_to_fp16 = const()[name = tensor("op_998_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(215610112)))]; tensor var_999_to_fp16 = const()[name = tensor("op_999_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217707328)))]; tensor v_33_cast = linear(bias = var_999_to_fp16, weight = var_998_to_fp16, x = var_979_cast); tensor var_1007 = const()[name = tensor("op_1007"), val = tensor([1, 1500, 16, -1])]; tensor var_1008_cast = reshape(shape = var_1007, x = q_33_cast); tensor const_184_to_fp16 = const()[name = tensor("const_184_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_35_cast = mul(x = var_1008_cast, y = const_184_to_fp16); tensor var_1014 = const()[name = tensor("op_1014"), val = tensor([1, 1500, 16, -1])]; tensor var_1015_cast = reshape(shape = var_1014, x = k_33_cast); tensor const_185_to_fp16 = const()[name = tensor("const_185_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_35_cast = mul(x = var_1015_cast, y = const_185_to_fp16); tensor var_1021 = const()[name = tensor("op_1021"), val = tensor([1, 1500, 16, -1])]; tensor var_1022_cast = reshape(shape = var_1021, x = v_33_cast); tensor var_1023 = const()[name = tensor("op_1023"), val = tensor([0, 2, 1, 3])]; tensor qk_17_transpose_x_0 = const()[name = tensor("qk_17_transpose_x_0"), val = tensor(false)]; tensor qk_17_transpose_y_0 = const()[name = tensor("qk_17_transpose_y_0"), val = tensor(false)]; tensor transpose_64_perm_0 = const()[name = tensor("transpose_64_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_65_perm_0 = const()[name = tensor("transpose_65_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_157 = transpose(perm = transpose_65_perm_0, x = k_35_cast); tensor transpose_158 = transpose(perm = transpose_64_perm_0, x = q_35_cast); tensor qk_17_cast = matmul(transpose_x = qk_17_transpose_x_0, transpose_y = qk_17_transpose_y_0, x = transpose_158, y = transpose_157); tensor var_1027_cast = softmax(axis = var_962, x = qk_17_cast); tensor var_1029_transpose_x_0 = const()[name = tensor("op_1029_transpose_x_0"), val = tensor(false)]; tensor var_1029_transpose_y_0 = const()[name = tensor("op_1029_transpose_y_0"), val = tensor(false)]; tensor transpose_159 = transpose(perm = var_1023, x = var_1022_cast); tensor var_1029_cast = matmul(transpose_x = var_1029_transpose_x_0, transpose_y = var_1029_transpose_y_0, x = var_1027_cast, y = transpose_159); tensor var_1030 = const()[name = tensor("op_1030"), val = tensor([0, 2, 1, 3])]; tensor concat_8 = const()[name = tensor("concat_8"), val = tensor([1, 1500, 1024])]; tensor transpose_156 = transpose(perm = var_1030, x = var_1029_cast); tensor x_107_cast = reshape(shape = concat_8, x = transpose_156); tensor var_1035_to_fp16 = const()[name = tensor("op_1035_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(217709440)))]; tensor var_1036_to_fp16 = const()[name = tensor("op_1036_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219806656)))]; tensor var_1037_cast = linear(bias = var_1036_to_fp16, weight = var_1035_to_fp16, x = x_107_cast); tensor x_109_cast = add(x = x_103_cast, y = var_1037_cast); tensor var_1043_axes_0 = const()[name = tensor("op_1043_axes_0"), val = tensor([-1])]; tensor blocks_8_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_8_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219808768)))]; tensor blocks_8_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_8_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219810880)))]; tensor var_1043_cast = layer_norm(axes = var_1043_axes_0, beta = blocks_8_mlp_ln_bias_to_fp16, epsilon = var_968_to_fp16, gamma = blocks_8_mlp_ln_weight_to_fp16, x = x_109_cast); tensor var_1052_to_fp16 = const()[name = tensor("op_1052_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(219812992)))]; tensor var_1053_to_fp16 = const()[name = tensor("op_1053_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(228201664)))]; tensor input_73_cast = linear(bias = var_1053_to_fp16, weight = var_1052_to_fp16, x = var_1043_cast); tensor x_113_mode_0 = const()[name = tensor("x_113_mode_0"), val = tensor("EXACT")]; tensor x_113_cast = gelu(mode = x_113_mode_0, x = input_73_cast); tensor var_1058_to_fp16 = const()[name = tensor("op_1058_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(228209920)))]; tensor var_1059_to_fp16 = const()[name = tensor("op_1059_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236598592)))]; tensor var_1060_cast = linear(bias = var_1059_to_fp16, weight = var_1058_to_fp16, x = x_113_cast); tensor x_115_cast = add(x = x_109_cast, y = var_1060_cast); tensor var_1069 = const()[name = tensor("op_1069"), val = tensor(-1)]; tensor var_1086_axes_0 = const()[name = tensor("op_1086_axes_0"), val = tensor([-1])]; tensor blocks_9_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_9_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236600704)))]; tensor blocks_9_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_9_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236602816)))]; tensor var_1075_to_fp16 = const()[name = tensor("op_1075_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1086_cast = layer_norm(axes = var_1086_axes_0, beta = blocks_9_attn_ln_bias_to_fp16, epsilon = var_1075_to_fp16, gamma = blocks_9_attn_ln_weight_to_fp16, x = x_115_cast); tensor var_1097_to_fp16 = const()[name = tensor("op_1097_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(236604928)))]; tensor var_1098_to_fp16 = const()[name = tensor("op_1098_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(238702144)))]; tensor q_37_cast = linear(bias = var_1098_to_fp16, weight = var_1097_to_fp16, x = var_1086_cast); tensor var_1101_to_fp16 = const()[name = tensor("op_1101_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(238704256)))]; tensor k_37_bias_0_to_fp16 = const()[name = tensor("k_37_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240801472)))]; tensor k_37_cast = linear(bias = k_37_bias_0_to_fp16, weight = var_1101_to_fp16, x = var_1086_cast); tensor var_1105_to_fp16 = const()[name = tensor("op_1105_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(240803584)))]; tensor var_1106_to_fp16 = const()[name = tensor("op_1106_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(242900800)))]; tensor v_37_cast = linear(bias = var_1106_to_fp16, weight = var_1105_to_fp16, x = var_1086_cast); tensor var_1114 = const()[name = tensor("op_1114"), val = tensor([1, 1500, 16, -1])]; tensor var_1115_cast = reshape(shape = var_1114, x = q_37_cast); tensor const_186_to_fp16 = const()[name = tensor("const_186_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_39_cast = mul(x = var_1115_cast, y = const_186_to_fp16); tensor var_1121 = const()[name = tensor("op_1121"), val = tensor([1, 1500, 16, -1])]; tensor var_1122_cast = reshape(shape = var_1121, x = k_37_cast); tensor const_187_to_fp16 = const()[name = tensor("const_187_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_39_cast = mul(x = var_1122_cast, y = const_187_to_fp16); tensor var_1128 = const()[name = tensor("op_1128"), val = tensor([1, 1500, 16, -1])]; tensor var_1129_cast = reshape(shape = var_1128, x = v_37_cast); tensor var_1130 = const()[name = tensor("op_1130"), val = tensor([0, 2, 1, 3])]; tensor qk_19_transpose_x_0 = const()[name = tensor("qk_19_transpose_x_0"), val = tensor(false)]; tensor qk_19_transpose_y_0 = const()[name = tensor("qk_19_transpose_y_0"), val = tensor(false)]; tensor transpose_66_perm_0 = const()[name = tensor("transpose_66_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_67_perm_0 = const()[name = tensor("transpose_67_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_153 = transpose(perm = transpose_67_perm_0, x = k_39_cast); tensor transpose_154 = transpose(perm = transpose_66_perm_0, x = q_39_cast); tensor qk_19_cast = matmul(transpose_x = qk_19_transpose_x_0, transpose_y = qk_19_transpose_y_0, x = transpose_154, y = transpose_153); tensor var_1134_cast = softmax(axis = var_1069, x = qk_19_cast); tensor var_1136_transpose_x_0 = const()[name = tensor("op_1136_transpose_x_0"), val = tensor(false)]; tensor var_1136_transpose_y_0 = const()[name = tensor("op_1136_transpose_y_0"), val = tensor(false)]; tensor transpose_155 = transpose(perm = var_1130, x = var_1129_cast); tensor var_1136_cast = matmul(transpose_x = var_1136_transpose_x_0, transpose_y = var_1136_transpose_y_0, x = var_1134_cast, y = transpose_155); tensor var_1137 = const()[name = tensor("op_1137"), val = tensor([0, 2, 1, 3])]; tensor concat_9 = const()[name = tensor("concat_9"), val = tensor([1, 1500, 1024])]; tensor transpose_152 = transpose(perm = var_1137, x = var_1136_cast); tensor x_119_cast = reshape(shape = concat_9, x = transpose_152); tensor var_1142_to_fp16 = const()[name = tensor("op_1142_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(242902912)))]; tensor var_1143_to_fp16 = const()[name = tensor("op_1143_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245000128)))]; tensor var_1144_cast = linear(bias = var_1143_to_fp16, weight = var_1142_to_fp16, x = x_119_cast); tensor x_121_cast = add(x = x_115_cast, y = var_1144_cast); tensor var_1150_axes_0 = const()[name = tensor("op_1150_axes_0"), val = tensor([-1])]; tensor blocks_9_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_9_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245002240)))]; tensor blocks_9_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_9_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245004352)))]; tensor var_1150_cast = layer_norm(axes = var_1150_axes_0, beta = blocks_9_mlp_ln_bias_to_fp16, epsilon = var_1075_to_fp16, gamma = blocks_9_mlp_ln_weight_to_fp16, x = x_121_cast); tensor var_1159_to_fp16 = const()[name = tensor("op_1159_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(245006464)))]; tensor var_1160_to_fp16 = const()[name = tensor("op_1160_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253395136)))]; tensor input_81_cast = linear(bias = var_1160_to_fp16, weight = var_1159_to_fp16, x = var_1150_cast); tensor x_125_mode_0 = const()[name = tensor("x_125_mode_0"), val = tensor("EXACT")]; tensor x_125_cast = gelu(mode = x_125_mode_0, x = input_81_cast); tensor var_1165_to_fp16 = const()[name = tensor("op_1165_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(253403392)))]; tensor var_1166_to_fp16 = const()[name = tensor("op_1166_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261792064)))]; tensor var_1167_cast = linear(bias = var_1166_to_fp16, weight = var_1165_to_fp16, x = x_125_cast); tensor x_127_cast = add(x = x_121_cast, y = var_1167_cast); tensor var_1176 = const()[name = tensor("op_1176"), val = tensor(-1)]; tensor var_1193_axes_0 = const()[name = tensor("op_1193_axes_0"), val = tensor([-1])]; tensor blocks_10_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_10_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261794176)))]; tensor blocks_10_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_10_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261796288)))]; tensor var_1182_to_fp16 = const()[name = tensor("op_1182_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1193_cast = layer_norm(axes = var_1193_axes_0, beta = blocks_10_attn_ln_bias_to_fp16, epsilon = var_1182_to_fp16, gamma = blocks_10_attn_ln_weight_to_fp16, x = x_127_cast); tensor var_1204_to_fp16 = const()[name = tensor("op_1204_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(261798400)))]; tensor var_1205_to_fp16 = const()[name = tensor("op_1205_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263895616)))]; tensor q_41_cast = linear(bias = var_1205_to_fp16, weight = var_1204_to_fp16, x = var_1193_cast); tensor var_1208_to_fp16 = const()[name = tensor("op_1208_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(263897728)))]; tensor k_41_bias_0_to_fp16 = const()[name = tensor("k_41_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265994944)))]; tensor k_41_cast = linear(bias = k_41_bias_0_to_fp16, weight = var_1208_to_fp16, x = var_1193_cast); tensor var_1212_to_fp16 = const()[name = tensor("op_1212_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(265997056)))]; tensor var_1213_to_fp16 = const()[name = tensor("op_1213_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268094272)))]; tensor v_41_cast = linear(bias = var_1213_to_fp16, weight = var_1212_to_fp16, x = var_1193_cast); tensor var_1221 = const()[name = tensor("op_1221"), val = tensor([1, 1500, 16, -1])]; tensor var_1222_cast = reshape(shape = var_1221, x = q_41_cast); tensor const_188_to_fp16 = const()[name = tensor("const_188_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_43_cast = mul(x = var_1222_cast, y = const_188_to_fp16); tensor var_1228 = const()[name = tensor("op_1228"), val = tensor([1, 1500, 16, -1])]; tensor var_1229_cast = reshape(shape = var_1228, x = k_41_cast); tensor const_189_to_fp16 = const()[name = tensor("const_189_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_43_cast = mul(x = var_1229_cast, y = const_189_to_fp16); tensor var_1235 = const()[name = tensor("op_1235"), val = tensor([1, 1500, 16, -1])]; tensor var_1236_cast = reshape(shape = var_1235, x = v_41_cast); tensor var_1237 = const()[name = tensor("op_1237"), val = tensor([0, 2, 1, 3])]; tensor qk_21_transpose_x_0 = const()[name = tensor("qk_21_transpose_x_0"), val = tensor(false)]; tensor qk_21_transpose_y_0 = const()[name = tensor("qk_21_transpose_y_0"), val = tensor(false)]; tensor transpose_68_perm_0 = const()[name = tensor("transpose_68_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_69_perm_0 = const()[name = tensor("transpose_69_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_149 = transpose(perm = transpose_69_perm_0, x = k_43_cast); tensor transpose_150 = transpose(perm = transpose_68_perm_0, x = q_43_cast); tensor qk_21_cast = matmul(transpose_x = qk_21_transpose_x_0, transpose_y = qk_21_transpose_y_0, x = transpose_150, y = transpose_149); tensor var_1241_cast = softmax(axis = var_1176, x = qk_21_cast); tensor var_1243_transpose_x_0 = const()[name = tensor("op_1243_transpose_x_0"), val = tensor(false)]; tensor var_1243_transpose_y_0 = const()[name = tensor("op_1243_transpose_y_0"), val = tensor(false)]; tensor transpose_151 = transpose(perm = var_1237, x = var_1236_cast); tensor var_1243_cast = matmul(transpose_x = var_1243_transpose_x_0, transpose_y = var_1243_transpose_y_0, x = var_1241_cast, y = transpose_151); tensor var_1244 = const()[name = tensor("op_1244"), val = tensor([0, 2, 1, 3])]; tensor concat_10 = const()[name = tensor("concat_10"), val = tensor([1, 1500, 1024])]; tensor transpose_148 = transpose(perm = var_1244, x = var_1243_cast); tensor x_131_cast = reshape(shape = concat_10, x = transpose_148); tensor var_1249_to_fp16 = const()[name = tensor("op_1249_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(268096384)))]; tensor var_1250_to_fp16 = const()[name = tensor("op_1250_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270193600)))]; tensor var_1251_cast = linear(bias = var_1250_to_fp16, weight = var_1249_to_fp16, x = x_131_cast); tensor x_133_cast = add(x = x_127_cast, y = var_1251_cast); tensor var_1257_axes_0 = const()[name = tensor("op_1257_axes_0"), val = tensor([-1])]; tensor blocks_10_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_10_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270195712)))]; tensor blocks_10_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_10_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270197824)))]; tensor var_1257_cast = layer_norm(axes = var_1257_axes_0, beta = blocks_10_mlp_ln_bias_to_fp16, epsilon = var_1182_to_fp16, gamma = blocks_10_mlp_ln_weight_to_fp16, x = x_133_cast); tensor var_1266_to_fp16 = const()[name = tensor("op_1266_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(270199936)))]; tensor var_1267_to_fp16 = const()[name = tensor("op_1267_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278588608)))]; tensor input_89_cast = linear(bias = var_1267_to_fp16, weight = var_1266_to_fp16, x = var_1257_cast); tensor x_137_mode_0 = const()[name = tensor("x_137_mode_0"), val = tensor("EXACT")]; tensor x_137_cast = gelu(mode = x_137_mode_0, x = input_89_cast); tensor var_1272_to_fp16 = const()[name = tensor("op_1272_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(278596864)))]; tensor var_1273_to_fp16 = const()[name = tensor("op_1273_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286985536)))]; tensor var_1274_cast = linear(bias = var_1273_to_fp16, weight = var_1272_to_fp16, x = x_137_cast); tensor x_139_cast = add(x = x_133_cast, y = var_1274_cast); tensor var_1283 = const()[name = tensor("op_1283"), val = tensor(-1)]; tensor var_1300_axes_0 = const()[name = tensor("op_1300_axes_0"), val = tensor([-1])]; tensor blocks_11_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_11_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286987648)))]; tensor blocks_11_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_11_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286989760)))]; tensor var_1289_to_fp16 = const()[name = tensor("op_1289_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1300_cast = layer_norm(axes = var_1300_axes_0, beta = blocks_11_attn_ln_bias_to_fp16, epsilon = var_1289_to_fp16, gamma = blocks_11_attn_ln_weight_to_fp16, x = x_139_cast); tensor var_1311_to_fp16 = const()[name = tensor("op_1311_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(286991872)))]; tensor var_1312_to_fp16 = const()[name = tensor("op_1312_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(289089088)))]; tensor q_45_cast = linear(bias = var_1312_to_fp16, weight = var_1311_to_fp16, x = var_1300_cast); tensor var_1315_to_fp16 = const()[name = tensor("op_1315_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(289091200)))]; tensor k_45_bias_0_to_fp16 = const()[name = tensor("k_45_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291188416)))]; tensor k_45_cast = linear(bias = k_45_bias_0_to_fp16, weight = var_1315_to_fp16, x = var_1300_cast); tensor var_1319_to_fp16 = const()[name = tensor("op_1319_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(291190528)))]; tensor var_1320_to_fp16 = const()[name = tensor("op_1320_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293287744)))]; tensor v_45_cast = linear(bias = var_1320_to_fp16, weight = var_1319_to_fp16, x = var_1300_cast); tensor var_1328 = const()[name = tensor("op_1328"), val = tensor([1, 1500, 16, -1])]; tensor var_1329_cast = reshape(shape = var_1328, x = q_45_cast); tensor const_190_to_fp16 = const()[name = tensor("const_190_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_47_cast = mul(x = var_1329_cast, y = const_190_to_fp16); tensor var_1335 = const()[name = tensor("op_1335"), val = tensor([1, 1500, 16, -1])]; tensor var_1336_cast = reshape(shape = var_1335, x = k_45_cast); tensor const_191_to_fp16 = const()[name = tensor("const_191_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_47_cast = mul(x = var_1336_cast, y = const_191_to_fp16); tensor var_1342 = const()[name = tensor("op_1342"), val = tensor([1, 1500, 16, -1])]; tensor var_1343_cast = reshape(shape = var_1342, x = v_45_cast); tensor var_1344 = const()[name = tensor("op_1344"), val = tensor([0, 2, 1, 3])]; tensor qk_23_transpose_x_0 = const()[name = tensor("qk_23_transpose_x_0"), val = tensor(false)]; tensor qk_23_transpose_y_0 = const()[name = tensor("qk_23_transpose_y_0"), val = tensor(false)]; tensor transpose_70_perm_0 = const()[name = tensor("transpose_70_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_71_perm_0 = const()[name = tensor("transpose_71_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_145 = transpose(perm = transpose_71_perm_0, x = k_47_cast); tensor transpose_146 = transpose(perm = transpose_70_perm_0, x = q_47_cast); tensor qk_23_cast = matmul(transpose_x = qk_23_transpose_x_0, transpose_y = qk_23_transpose_y_0, x = transpose_146, y = transpose_145); tensor var_1348_cast = softmax(axis = var_1283, x = qk_23_cast); tensor var_1350_transpose_x_0 = const()[name = tensor("op_1350_transpose_x_0"), val = tensor(false)]; tensor var_1350_transpose_y_0 = const()[name = tensor("op_1350_transpose_y_0"), val = tensor(false)]; tensor transpose_147 = transpose(perm = var_1344, x = var_1343_cast); tensor var_1350_cast = matmul(transpose_x = var_1350_transpose_x_0, transpose_y = var_1350_transpose_y_0, x = var_1348_cast, y = transpose_147); tensor var_1351 = const()[name = tensor("op_1351"), val = tensor([0, 2, 1, 3])]; tensor concat_11 = const()[name = tensor("concat_11"), val = tensor([1, 1500, 1024])]; tensor transpose_144 = transpose(perm = var_1351, x = var_1350_cast); tensor x_143_cast = reshape(shape = concat_11, x = transpose_144); tensor var_1356_to_fp16 = const()[name = tensor("op_1356_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(293289856)))]; tensor var_1357_to_fp16 = const()[name = tensor("op_1357_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295387072)))]; tensor var_1358_cast = linear(bias = var_1357_to_fp16, weight = var_1356_to_fp16, x = x_143_cast); tensor x_145_cast = add(x = x_139_cast, y = var_1358_cast); tensor var_1364_axes_0 = const()[name = tensor("op_1364_axes_0"), val = tensor([-1])]; tensor blocks_11_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_11_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295389184)))]; tensor blocks_11_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_11_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295391296)))]; tensor var_1364_cast = layer_norm(axes = var_1364_axes_0, beta = blocks_11_mlp_ln_bias_to_fp16, epsilon = var_1289_to_fp16, gamma = blocks_11_mlp_ln_weight_to_fp16, x = x_145_cast); tensor var_1373_to_fp16 = const()[name = tensor("op_1373_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(295393408)))]; tensor var_1374_to_fp16 = const()[name = tensor("op_1374_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303782080)))]; tensor input_97_cast = linear(bias = var_1374_to_fp16, weight = var_1373_to_fp16, x = var_1364_cast); tensor x_149_mode_0 = const()[name = tensor("x_149_mode_0"), val = tensor("EXACT")]; tensor x_149_cast = gelu(mode = x_149_mode_0, x = input_97_cast); tensor var_1379_to_fp16 = const()[name = tensor("op_1379_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(303790336)))]; tensor var_1380_to_fp16 = const()[name = tensor("op_1380_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312179008)))]; tensor var_1381_cast = linear(bias = var_1380_to_fp16, weight = var_1379_to_fp16, x = x_149_cast); tensor x_151_cast = add(x = x_145_cast, y = var_1381_cast); tensor var_1390 = const()[name = tensor("op_1390"), val = tensor(-1)]; tensor var_1407_axes_0 = const()[name = tensor("op_1407_axes_0"), val = tensor([-1])]; tensor blocks_12_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_12_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312181120)))]; tensor blocks_12_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_12_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312183232)))]; tensor var_1396_to_fp16 = const()[name = tensor("op_1396_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1407_cast = layer_norm(axes = var_1407_axes_0, beta = blocks_12_attn_ln_bias_to_fp16, epsilon = var_1396_to_fp16, gamma = blocks_12_attn_ln_weight_to_fp16, x = x_151_cast); tensor var_1418_to_fp16 = const()[name = tensor("op_1418_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(312185344)))]; tensor var_1419_to_fp16 = const()[name = tensor("op_1419_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(314282560)))]; tensor q_49_cast = linear(bias = var_1419_to_fp16, weight = var_1418_to_fp16, x = var_1407_cast); tensor var_1422_to_fp16 = const()[name = tensor("op_1422_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(314284672)))]; tensor k_49_bias_0_to_fp16 = const()[name = tensor("k_49_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316381888)))]; tensor k_49_cast = linear(bias = k_49_bias_0_to_fp16, weight = var_1422_to_fp16, x = var_1407_cast); tensor var_1426_to_fp16 = const()[name = tensor("op_1426_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(316384000)))]; tensor var_1427_to_fp16 = const()[name = tensor("op_1427_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(318481216)))]; tensor v_49_cast = linear(bias = var_1427_to_fp16, weight = var_1426_to_fp16, x = var_1407_cast); tensor var_1435 = const()[name = tensor("op_1435"), val = tensor([1, 1500, 16, -1])]; tensor var_1436_cast = reshape(shape = var_1435, x = q_49_cast); tensor const_192_to_fp16 = const()[name = tensor("const_192_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_51_cast = mul(x = var_1436_cast, y = const_192_to_fp16); tensor var_1442 = const()[name = tensor("op_1442"), val = tensor([1, 1500, 16, -1])]; tensor var_1443_cast = reshape(shape = var_1442, x = k_49_cast); tensor const_193_to_fp16 = const()[name = tensor("const_193_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_51_cast = mul(x = var_1443_cast, y = const_193_to_fp16); tensor var_1449 = const()[name = tensor("op_1449"), val = tensor([1, 1500, 16, -1])]; tensor var_1450_cast = reshape(shape = var_1449, x = v_49_cast); tensor var_1451 = const()[name = tensor("op_1451"), val = tensor([0, 2, 1, 3])]; tensor qk_25_transpose_x_0 = const()[name = tensor("qk_25_transpose_x_0"), val = tensor(false)]; tensor qk_25_transpose_y_0 = const()[name = tensor("qk_25_transpose_y_0"), val = tensor(false)]; tensor transpose_72_perm_0 = const()[name = tensor("transpose_72_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_73_perm_0 = const()[name = tensor("transpose_73_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_141 = transpose(perm = transpose_73_perm_0, x = k_51_cast); tensor transpose_142 = transpose(perm = transpose_72_perm_0, x = q_51_cast); tensor qk_25_cast = matmul(transpose_x = qk_25_transpose_x_0, transpose_y = qk_25_transpose_y_0, x = transpose_142, y = transpose_141); tensor var_1455_cast = softmax(axis = var_1390, x = qk_25_cast); tensor var_1457_transpose_x_0 = const()[name = tensor("op_1457_transpose_x_0"), val = tensor(false)]; tensor var_1457_transpose_y_0 = const()[name = tensor("op_1457_transpose_y_0"), val = tensor(false)]; tensor transpose_143 = transpose(perm = var_1451, x = var_1450_cast); tensor var_1457_cast = matmul(transpose_x = var_1457_transpose_x_0, transpose_y = var_1457_transpose_y_0, x = var_1455_cast, y = transpose_143); tensor var_1458 = const()[name = tensor("op_1458"), val = tensor([0, 2, 1, 3])]; tensor concat_12 = const()[name = tensor("concat_12"), val = tensor([1, 1500, 1024])]; tensor transpose_140 = transpose(perm = var_1458, x = var_1457_cast); tensor x_155_cast = reshape(shape = concat_12, x = transpose_140); tensor var_1463_to_fp16 = const()[name = tensor("op_1463_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(318483328)))]; tensor var_1464_to_fp16 = const()[name = tensor("op_1464_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320580544)))]; tensor var_1465_cast = linear(bias = var_1464_to_fp16, weight = var_1463_to_fp16, x = x_155_cast); tensor x_157_cast = add(x = x_151_cast, y = var_1465_cast); tensor var_1471_axes_0 = const()[name = tensor("op_1471_axes_0"), val = tensor([-1])]; tensor blocks_12_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_12_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320582656)))]; tensor blocks_12_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_12_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320584768)))]; tensor var_1471_cast = layer_norm(axes = var_1471_axes_0, beta = blocks_12_mlp_ln_bias_to_fp16, epsilon = var_1396_to_fp16, gamma = blocks_12_mlp_ln_weight_to_fp16, x = x_157_cast); tensor var_1480_to_fp16 = const()[name = tensor("op_1480_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(320586880)))]; tensor var_1481_to_fp16 = const()[name = tensor("op_1481_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(328975552)))]; tensor input_105_cast = linear(bias = var_1481_to_fp16, weight = var_1480_to_fp16, x = var_1471_cast); tensor x_161_mode_0 = const()[name = tensor("x_161_mode_0"), val = tensor("EXACT")]; tensor x_161_cast = gelu(mode = x_161_mode_0, x = input_105_cast); tensor var_1486_to_fp16 = const()[name = tensor("op_1486_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(328983808)))]; tensor var_1487_to_fp16 = const()[name = tensor("op_1487_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337372480)))]; tensor var_1488_cast = linear(bias = var_1487_to_fp16, weight = var_1486_to_fp16, x = x_161_cast); tensor x_163_cast = add(x = x_157_cast, y = var_1488_cast); tensor var_1497 = const()[name = tensor("op_1497"), val = tensor(-1)]; tensor var_1514_axes_0 = const()[name = tensor("op_1514_axes_0"), val = tensor([-1])]; tensor blocks_13_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_13_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337374592)))]; tensor blocks_13_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_13_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337376704)))]; tensor var_1503_to_fp16 = const()[name = tensor("op_1503_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1514_cast = layer_norm(axes = var_1514_axes_0, beta = blocks_13_attn_ln_bias_to_fp16, epsilon = var_1503_to_fp16, gamma = blocks_13_attn_ln_weight_to_fp16, x = x_163_cast); tensor var_1525_to_fp16 = const()[name = tensor("op_1525_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(337378816)))]; tensor var_1526_to_fp16 = const()[name = tensor("op_1526_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339476032)))]; tensor q_53_cast = linear(bias = var_1526_to_fp16, weight = var_1525_to_fp16, x = var_1514_cast); tensor var_1529_to_fp16 = const()[name = tensor("op_1529_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(339478144)))]; tensor k_53_bias_0_to_fp16 = const()[name = tensor("k_53_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341575360)))]; tensor k_53_cast = linear(bias = k_53_bias_0_to_fp16, weight = var_1529_to_fp16, x = var_1514_cast); tensor var_1533_to_fp16 = const()[name = tensor("op_1533_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(341577472)))]; tensor var_1534_to_fp16 = const()[name = tensor("op_1534_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343674688)))]; tensor v_53_cast = linear(bias = var_1534_to_fp16, weight = var_1533_to_fp16, x = var_1514_cast); tensor var_1542 = const()[name = tensor("op_1542"), val = tensor([1, 1500, 16, -1])]; tensor var_1543_cast = reshape(shape = var_1542, x = q_53_cast); tensor const_194_to_fp16 = const()[name = tensor("const_194_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_55_cast = mul(x = var_1543_cast, y = const_194_to_fp16); tensor var_1549 = const()[name = tensor("op_1549"), val = tensor([1, 1500, 16, -1])]; tensor var_1550_cast = reshape(shape = var_1549, x = k_53_cast); tensor const_195_to_fp16 = const()[name = tensor("const_195_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_55_cast = mul(x = var_1550_cast, y = const_195_to_fp16); tensor var_1556 = const()[name = tensor("op_1556"), val = tensor([1, 1500, 16, -1])]; tensor var_1557_cast = reshape(shape = var_1556, x = v_53_cast); tensor var_1558 = const()[name = tensor("op_1558"), val = tensor([0, 2, 1, 3])]; tensor qk_27_transpose_x_0 = const()[name = tensor("qk_27_transpose_x_0"), val = tensor(false)]; tensor qk_27_transpose_y_0 = const()[name = tensor("qk_27_transpose_y_0"), val = tensor(false)]; tensor transpose_74_perm_0 = const()[name = tensor("transpose_74_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_75_perm_0 = const()[name = tensor("transpose_75_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_137 = transpose(perm = transpose_75_perm_0, x = k_55_cast); tensor transpose_138 = transpose(perm = transpose_74_perm_0, x = q_55_cast); tensor qk_27_cast = matmul(transpose_x = qk_27_transpose_x_0, transpose_y = qk_27_transpose_y_0, x = transpose_138, y = transpose_137); tensor var_1562_cast = softmax(axis = var_1497, x = qk_27_cast); tensor var_1564_transpose_x_0 = const()[name = tensor("op_1564_transpose_x_0"), val = tensor(false)]; tensor var_1564_transpose_y_0 = const()[name = tensor("op_1564_transpose_y_0"), val = tensor(false)]; tensor transpose_139 = transpose(perm = var_1558, x = var_1557_cast); tensor var_1564_cast = matmul(transpose_x = var_1564_transpose_x_0, transpose_y = var_1564_transpose_y_0, x = var_1562_cast, y = transpose_139); tensor var_1565 = const()[name = tensor("op_1565"), val = tensor([0, 2, 1, 3])]; tensor concat_13 = const()[name = tensor("concat_13"), val = tensor([1, 1500, 1024])]; tensor transpose_136 = transpose(perm = var_1565, x = var_1564_cast); tensor x_167_cast = reshape(shape = concat_13, x = transpose_136); tensor var_1570_to_fp16 = const()[name = tensor("op_1570_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(343676800)))]; tensor var_1571_to_fp16 = const()[name = tensor("op_1571_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345774016)))]; tensor var_1572_cast = linear(bias = var_1571_to_fp16, weight = var_1570_to_fp16, x = x_167_cast); tensor x_169_cast = add(x = x_163_cast, y = var_1572_cast); tensor var_1578_axes_0 = const()[name = tensor("op_1578_axes_0"), val = tensor([-1])]; tensor blocks_13_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_13_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345776128)))]; tensor blocks_13_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_13_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345778240)))]; tensor var_1578_cast = layer_norm(axes = var_1578_axes_0, beta = blocks_13_mlp_ln_bias_to_fp16, epsilon = var_1503_to_fp16, gamma = blocks_13_mlp_ln_weight_to_fp16, x = x_169_cast); tensor var_1587_to_fp16 = const()[name = tensor("op_1587_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(345780352)))]; tensor var_1588_to_fp16 = const()[name = tensor("op_1588_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354169024)))]; tensor input_113_cast = linear(bias = var_1588_to_fp16, weight = var_1587_to_fp16, x = var_1578_cast); tensor x_173_mode_0 = const()[name = tensor("x_173_mode_0"), val = tensor("EXACT")]; tensor x_173_cast = gelu(mode = x_173_mode_0, x = input_113_cast); tensor var_1593_to_fp16 = const()[name = tensor("op_1593_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(354177280)))]; tensor var_1594_to_fp16 = const()[name = tensor("op_1594_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362565952)))]; tensor var_1595_cast = linear(bias = var_1594_to_fp16, weight = var_1593_to_fp16, x = x_173_cast); tensor x_175_cast = add(x = x_169_cast, y = var_1595_cast); tensor var_1604 = const()[name = tensor("op_1604"), val = tensor(-1)]; tensor var_1621_axes_0 = const()[name = tensor("op_1621_axes_0"), val = tensor([-1])]; tensor blocks_14_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_14_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362568064)))]; tensor blocks_14_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_14_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362570176)))]; tensor var_1610_to_fp16 = const()[name = tensor("op_1610_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1621_cast = layer_norm(axes = var_1621_axes_0, beta = blocks_14_attn_ln_bias_to_fp16, epsilon = var_1610_to_fp16, gamma = blocks_14_attn_ln_weight_to_fp16, x = x_175_cast); tensor var_1632_to_fp16 = const()[name = tensor("op_1632_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(362572288)))]; tensor var_1633_to_fp16 = const()[name = tensor("op_1633_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(364669504)))]; tensor q_57_cast = linear(bias = var_1633_to_fp16, weight = var_1632_to_fp16, x = var_1621_cast); tensor var_1636_to_fp16 = const()[name = tensor("op_1636_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(364671616)))]; tensor k_57_bias_0_to_fp16 = const()[name = tensor("k_57_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(366768832)))]; tensor k_57_cast = linear(bias = k_57_bias_0_to_fp16, weight = var_1636_to_fp16, x = var_1621_cast); tensor var_1640_to_fp16 = const()[name = tensor("op_1640_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(366770944)))]; tensor var_1641_to_fp16 = const()[name = tensor("op_1641_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368868160)))]; tensor v_57_cast = linear(bias = var_1641_to_fp16, weight = var_1640_to_fp16, x = var_1621_cast); tensor var_1649 = const()[name = tensor("op_1649"), val = tensor([1, 1500, 16, -1])]; tensor var_1650_cast = reshape(shape = var_1649, x = q_57_cast); tensor const_196_to_fp16 = const()[name = tensor("const_196_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_59_cast = mul(x = var_1650_cast, y = const_196_to_fp16); tensor var_1656 = const()[name = tensor("op_1656"), val = tensor([1, 1500, 16, -1])]; tensor var_1657_cast = reshape(shape = var_1656, x = k_57_cast); tensor const_197_to_fp16 = const()[name = tensor("const_197_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_59_cast = mul(x = var_1657_cast, y = const_197_to_fp16); tensor var_1663 = const()[name = tensor("op_1663"), val = tensor([1, 1500, 16, -1])]; tensor var_1664_cast = reshape(shape = var_1663, x = v_57_cast); tensor var_1665 = const()[name = tensor("op_1665"), val = tensor([0, 2, 1, 3])]; tensor qk_29_transpose_x_0 = const()[name = tensor("qk_29_transpose_x_0"), val = tensor(false)]; tensor qk_29_transpose_y_0 = const()[name = tensor("qk_29_transpose_y_0"), val = tensor(false)]; tensor transpose_76_perm_0 = const()[name = tensor("transpose_76_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_77_perm_0 = const()[name = tensor("transpose_77_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_133 = transpose(perm = transpose_77_perm_0, x = k_59_cast); tensor transpose_134 = transpose(perm = transpose_76_perm_0, x = q_59_cast); tensor qk_29_cast = matmul(transpose_x = qk_29_transpose_x_0, transpose_y = qk_29_transpose_y_0, x = transpose_134, y = transpose_133); tensor var_1669_cast = softmax(axis = var_1604, x = qk_29_cast); tensor var_1671_transpose_x_0 = const()[name = tensor("op_1671_transpose_x_0"), val = tensor(false)]; tensor var_1671_transpose_y_0 = const()[name = tensor("op_1671_transpose_y_0"), val = tensor(false)]; tensor transpose_135 = transpose(perm = var_1665, x = var_1664_cast); tensor var_1671_cast = matmul(transpose_x = var_1671_transpose_x_0, transpose_y = var_1671_transpose_y_0, x = var_1669_cast, y = transpose_135); tensor var_1672 = const()[name = tensor("op_1672"), val = tensor([0, 2, 1, 3])]; tensor concat_14 = const()[name = tensor("concat_14"), val = tensor([1, 1500, 1024])]; tensor transpose_132 = transpose(perm = var_1672, x = var_1671_cast); tensor x_179_cast = reshape(shape = concat_14, x = transpose_132); tensor var_1677_to_fp16 = const()[name = tensor("op_1677_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(368870272)))]; tensor var_1678_to_fp16 = const()[name = tensor("op_1678_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370967488)))]; tensor var_1679_cast = linear(bias = var_1678_to_fp16, weight = var_1677_to_fp16, x = x_179_cast); tensor x_181_cast = add(x = x_175_cast, y = var_1679_cast); tensor var_1685_axes_0 = const()[name = tensor("op_1685_axes_0"), val = tensor([-1])]; tensor blocks_14_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_14_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370969600)))]; tensor blocks_14_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_14_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370971712)))]; tensor var_1685_cast = layer_norm(axes = var_1685_axes_0, beta = blocks_14_mlp_ln_bias_to_fp16, epsilon = var_1610_to_fp16, gamma = blocks_14_mlp_ln_weight_to_fp16, x = x_181_cast); tensor var_1694_to_fp16 = const()[name = tensor("op_1694_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(370973824)))]; tensor var_1695_to_fp16 = const()[name = tensor("op_1695_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(379362496)))]; tensor input_121_cast = linear(bias = var_1695_to_fp16, weight = var_1694_to_fp16, x = var_1685_cast); tensor x_185_mode_0 = const()[name = tensor("x_185_mode_0"), val = tensor("EXACT")]; tensor x_185_cast = gelu(mode = x_185_mode_0, x = input_121_cast); tensor var_1700_to_fp16 = const()[name = tensor("op_1700_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(379370752)))]; tensor var_1701_to_fp16 = const()[name = tensor("op_1701_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387759424)))]; tensor var_1702_cast = linear(bias = var_1701_to_fp16, weight = var_1700_to_fp16, x = x_185_cast); tensor x_187_cast = add(x = x_181_cast, y = var_1702_cast); tensor var_1711 = const()[name = tensor("op_1711"), val = tensor(-1)]; tensor var_1728_axes_0 = const()[name = tensor("op_1728_axes_0"), val = tensor([-1])]; tensor blocks_15_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_15_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387761536)))]; tensor blocks_15_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_15_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387763648)))]; tensor var_1717_to_fp16 = const()[name = tensor("op_1717_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1728_cast = layer_norm(axes = var_1728_axes_0, beta = blocks_15_attn_ln_bias_to_fp16, epsilon = var_1717_to_fp16, gamma = blocks_15_attn_ln_weight_to_fp16, x = x_187_cast); tensor var_1739_to_fp16 = const()[name = tensor("op_1739_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(387765760)))]; tensor var_1740_to_fp16 = const()[name = tensor("op_1740_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(389862976)))]; tensor q_61_cast = linear(bias = var_1740_to_fp16, weight = var_1739_to_fp16, x = var_1728_cast); tensor var_1743_to_fp16 = const()[name = tensor("op_1743_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(389865088)))]; tensor k_61_bias_0_to_fp16 = const()[name = tensor("k_61_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(391962304)))]; tensor k_61_cast = linear(bias = k_61_bias_0_to_fp16, weight = var_1743_to_fp16, x = var_1728_cast); tensor var_1747_to_fp16 = const()[name = tensor("op_1747_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(391964416)))]; tensor var_1748_to_fp16 = const()[name = tensor("op_1748_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394061632)))]; tensor v_61_cast = linear(bias = var_1748_to_fp16, weight = var_1747_to_fp16, x = var_1728_cast); tensor var_1756 = const()[name = tensor("op_1756"), val = tensor([1, 1500, 16, -1])]; tensor var_1757_cast = reshape(shape = var_1756, x = q_61_cast); tensor const_198_to_fp16 = const()[name = tensor("const_198_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_63_cast = mul(x = var_1757_cast, y = const_198_to_fp16); tensor var_1763 = const()[name = tensor("op_1763"), val = tensor([1, 1500, 16, -1])]; tensor var_1764_cast = reshape(shape = var_1763, x = k_61_cast); tensor const_199_to_fp16 = const()[name = tensor("const_199_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_63_cast = mul(x = var_1764_cast, y = const_199_to_fp16); tensor var_1770 = const()[name = tensor("op_1770"), val = tensor([1, 1500, 16, -1])]; tensor var_1771_cast = reshape(shape = var_1770, x = v_61_cast); tensor var_1772 = const()[name = tensor("op_1772"), val = tensor([0, 2, 1, 3])]; tensor qk_31_transpose_x_0 = const()[name = tensor("qk_31_transpose_x_0"), val = tensor(false)]; tensor qk_31_transpose_y_0 = const()[name = tensor("qk_31_transpose_y_0"), val = tensor(false)]; tensor transpose_78_perm_0 = const()[name = tensor("transpose_78_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_79_perm_0 = const()[name = tensor("transpose_79_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_129 = transpose(perm = transpose_79_perm_0, x = k_63_cast); tensor transpose_130 = transpose(perm = transpose_78_perm_0, x = q_63_cast); tensor qk_31_cast = matmul(transpose_x = qk_31_transpose_x_0, transpose_y = qk_31_transpose_y_0, x = transpose_130, y = transpose_129); tensor var_1776_cast = softmax(axis = var_1711, x = qk_31_cast); tensor var_1778_transpose_x_0 = const()[name = tensor("op_1778_transpose_x_0"), val = tensor(false)]; tensor var_1778_transpose_y_0 = const()[name = tensor("op_1778_transpose_y_0"), val = tensor(false)]; tensor transpose_131 = transpose(perm = var_1772, x = var_1771_cast); tensor var_1778_cast = matmul(transpose_x = var_1778_transpose_x_0, transpose_y = var_1778_transpose_y_0, x = var_1776_cast, y = transpose_131); tensor var_1779 = const()[name = tensor("op_1779"), val = tensor([0, 2, 1, 3])]; tensor concat_15 = const()[name = tensor("concat_15"), val = tensor([1, 1500, 1024])]; tensor transpose_128 = transpose(perm = var_1779, x = var_1778_cast); tensor x_191_cast = reshape(shape = concat_15, x = transpose_128); tensor var_1784_to_fp16 = const()[name = tensor("op_1784_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(394063744)))]; tensor var_1785_to_fp16 = const()[name = tensor("op_1785_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396160960)))]; tensor var_1786_cast = linear(bias = var_1785_to_fp16, weight = var_1784_to_fp16, x = x_191_cast); tensor x_193_cast = add(x = x_187_cast, y = var_1786_cast); tensor var_1792_axes_0 = const()[name = tensor("op_1792_axes_0"), val = tensor([-1])]; tensor blocks_15_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_15_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396163072)))]; tensor blocks_15_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_15_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396165184)))]; tensor var_1792_cast = layer_norm(axes = var_1792_axes_0, beta = blocks_15_mlp_ln_bias_to_fp16, epsilon = var_1717_to_fp16, gamma = blocks_15_mlp_ln_weight_to_fp16, x = x_193_cast); tensor var_1801_to_fp16 = const()[name = tensor("op_1801_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(396167296)))]; tensor var_1802_to_fp16 = const()[name = tensor("op_1802_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(404555968)))]; tensor input_129_cast = linear(bias = var_1802_to_fp16, weight = var_1801_to_fp16, x = var_1792_cast); tensor x_197_mode_0 = const()[name = tensor("x_197_mode_0"), val = tensor("EXACT")]; tensor x_197_cast = gelu(mode = x_197_mode_0, x = input_129_cast); tensor var_1807_to_fp16 = const()[name = tensor("op_1807_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(404564224)))]; tensor var_1808_to_fp16 = const()[name = tensor("op_1808_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412952896)))]; tensor var_1809_cast = linear(bias = var_1808_to_fp16, weight = var_1807_to_fp16, x = x_197_cast); tensor x_199_cast = add(x = x_193_cast, y = var_1809_cast); tensor var_1818 = const()[name = tensor("op_1818"), val = tensor(-1)]; tensor var_1835_axes_0 = const()[name = tensor("op_1835_axes_0"), val = tensor([-1])]; tensor blocks_16_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_16_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412955008)))]; tensor blocks_16_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_16_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412957120)))]; tensor var_1824_to_fp16 = const()[name = tensor("op_1824_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1835_cast = layer_norm(axes = var_1835_axes_0, beta = blocks_16_attn_ln_bias_to_fp16, epsilon = var_1824_to_fp16, gamma = blocks_16_attn_ln_weight_to_fp16, x = x_199_cast); tensor var_1846_to_fp16 = const()[name = tensor("op_1846_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(412959232)))]; tensor var_1847_to_fp16 = const()[name = tensor("op_1847_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415056448)))]; tensor q_65_cast = linear(bias = var_1847_to_fp16, weight = var_1846_to_fp16, x = var_1835_cast); tensor var_1850_to_fp16 = const()[name = tensor("op_1850_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(415058560)))]; tensor k_65_bias_0_to_fp16 = const()[name = tensor("k_65_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(417155776)))]; tensor k_65_cast = linear(bias = k_65_bias_0_to_fp16, weight = var_1850_to_fp16, x = var_1835_cast); tensor var_1854_to_fp16 = const()[name = tensor("op_1854_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(417157888)))]; tensor var_1855_to_fp16 = const()[name = tensor("op_1855_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419255104)))]; tensor v_65_cast = linear(bias = var_1855_to_fp16, weight = var_1854_to_fp16, x = var_1835_cast); tensor var_1863 = const()[name = tensor("op_1863"), val = tensor([1, 1500, 16, -1])]; tensor var_1864_cast = reshape(shape = var_1863, x = q_65_cast); tensor const_200_to_fp16 = const()[name = tensor("const_200_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_67_cast = mul(x = var_1864_cast, y = const_200_to_fp16); tensor var_1870 = const()[name = tensor("op_1870"), val = tensor([1, 1500, 16, -1])]; tensor var_1871_cast = reshape(shape = var_1870, x = k_65_cast); tensor const_201_to_fp16 = const()[name = tensor("const_201_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_67_cast = mul(x = var_1871_cast, y = const_201_to_fp16); tensor var_1877 = const()[name = tensor("op_1877"), val = tensor([1, 1500, 16, -1])]; tensor var_1878_cast = reshape(shape = var_1877, x = v_65_cast); tensor var_1879 = const()[name = tensor("op_1879"), val = tensor([0, 2, 1, 3])]; tensor qk_33_transpose_x_0 = const()[name = tensor("qk_33_transpose_x_0"), val = tensor(false)]; tensor qk_33_transpose_y_0 = const()[name = tensor("qk_33_transpose_y_0"), val = tensor(false)]; tensor transpose_80_perm_0 = const()[name = tensor("transpose_80_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_81_perm_0 = const()[name = tensor("transpose_81_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_125 = transpose(perm = transpose_81_perm_0, x = k_67_cast); tensor transpose_126 = transpose(perm = transpose_80_perm_0, x = q_67_cast); tensor qk_33_cast = matmul(transpose_x = qk_33_transpose_x_0, transpose_y = qk_33_transpose_y_0, x = transpose_126, y = transpose_125); tensor var_1883_cast = softmax(axis = var_1818, x = qk_33_cast); tensor var_1885_transpose_x_0 = const()[name = tensor("op_1885_transpose_x_0"), val = tensor(false)]; tensor var_1885_transpose_y_0 = const()[name = tensor("op_1885_transpose_y_0"), val = tensor(false)]; tensor transpose_127 = transpose(perm = var_1879, x = var_1878_cast); tensor var_1885_cast = matmul(transpose_x = var_1885_transpose_x_0, transpose_y = var_1885_transpose_y_0, x = var_1883_cast, y = transpose_127); tensor var_1886 = const()[name = tensor("op_1886"), val = tensor([0, 2, 1, 3])]; tensor concat_16 = const()[name = tensor("concat_16"), val = tensor([1, 1500, 1024])]; tensor transpose_124 = transpose(perm = var_1886, x = var_1885_cast); tensor x_203_cast = reshape(shape = concat_16, x = transpose_124); tensor var_1891_to_fp16 = const()[name = tensor("op_1891_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(419257216)))]; tensor var_1892_to_fp16 = const()[name = tensor("op_1892_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421354432)))]; tensor var_1893_cast = linear(bias = var_1892_to_fp16, weight = var_1891_to_fp16, x = x_203_cast); tensor x_205_cast = add(x = x_199_cast, y = var_1893_cast); tensor var_1899_axes_0 = const()[name = tensor("op_1899_axes_0"), val = tensor([-1])]; tensor blocks_16_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_16_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421356544)))]; tensor blocks_16_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_16_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421358656)))]; tensor var_1899_cast = layer_norm(axes = var_1899_axes_0, beta = blocks_16_mlp_ln_bias_to_fp16, epsilon = var_1824_to_fp16, gamma = blocks_16_mlp_ln_weight_to_fp16, x = x_205_cast); tensor var_1908_to_fp16 = const()[name = tensor("op_1908_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(421360768)))]; tensor var_1909_to_fp16 = const()[name = tensor("op_1909_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(429749440)))]; tensor input_137_cast = linear(bias = var_1909_to_fp16, weight = var_1908_to_fp16, x = var_1899_cast); tensor x_209_mode_0 = const()[name = tensor("x_209_mode_0"), val = tensor("EXACT")]; tensor x_209_cast = gelu(mode = x_209_mode_0, x = input_137_cast); tensor var_1914_to_fp16 = const()[name = tensor("op_1914_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(429757696)))]; tensor var_1915_to_fp16 = const()[name = tensor("op_1915_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(438146368)))]; tensor var_1916_cast = linear(bias = var_1915_to_fp16, weight = var_1914_to_fp16, x = x_209_cast); tensor x_211_cast = add(x = x_205_cast, y = var_1916_cast); tensor var_1925 = const()[name = tensor("op_1925"), val = tensor(-1)]; tensor var_1942_axes_0 = const()[name = tensor("op_1942_axes_0"), val = tensor([-1])]; tensor blocks_17_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_17_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(438148480)))]; tensor blocks_17_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_17_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(438150592)))]; tensor var_1931_to_fp16 = const()[name = tensor("op_1931_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_1942_cast = layer_norm(axes = var_1942_axes_0, beta = blocks_17_attn_ln_bias_to_fp16, epsilon = var_1931_to_fp16, gamma = blocks_17_attn_ln_weight_to_fp16, x = x_211_cast); tensor var_1953_to_fp16 = const()[name = tensor("op_1953_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(438152704)))]; tensor var_1954_to_fp16 = const()[name = tensor("op_1954_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(440249920)))]; tensor q_69_cast = linear(bias = var_1954_to_fp16, weight = var_1953_to_fp16, x = var_1942_cast); tensor var_1957_to_fp16 = const()[name = tensor("op_1957_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(440252032)))]; tensor k_69_bias_0_to_fp16 = const()[name = tensor("k_69_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442349248)))]; tensor k_69_cast = linear(bias = k_69_bias_0_to_fp16, weight = var_1957_to_fp16, x = var_1942_cast); tensor var_1961_to_fp16 = const()[name = tensor("op_1961_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(442351360)))]; tensor var_1962_to_fp16 = const()[name = tensor("op_1962_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444448576)))]; tensor v_69_cast = linear(bias = var_1962_to_fp16, weight = var_1961_to_fp16, x = var_1942_cast); tensor var_1970 = const()[name = tensor("op_1970"), val = tensor([1, 1500, 16, -1])]; tensor var_1971_cast = reshape(shape = var_1970, x = q_69_cast); tensor const_202_to_fp16 = const()[name = tensor("const_202_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_71_cast = mul(x = var_1971_cast, y = const_202_to_fp16); tensor var_1977 = const()[name = tensor("op_1977"), val = tensor([1, 1500, 16, -1])]; tensor var_1978_cast = reshape(shape = var_1977, x = k_69_cast); tensor const_203_to_fp16 = const()[name = tensor("const_203_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_71_cast = mul(x = var_1978_cast, y = const_203_to_fp16); tensor var_1984 = const()[name = tensor("op_1984"), val = tensor([1, 1500, 16, -1])]; tensor var_1985_cast = reshape(shape = var_1984, x = v_69_cast); tensor var_1986 = const()[name = tensor("op_1986"), val = tensor([0, 2, 1, 3])]; tensor qk_35_transpose_x_0 = const()[name = tensor("qk_35_transpose_x_0"), val = tensor(false)]; tensor qk_35_transpose_y_0 = const()[name = tensor("qk_35_transpose_y_0"), val = tensor(false)]; tensor transpose_82_perm_0 = const()[name = tensor("transpose_82_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_83_perm_0 = const()[name = tensor("transpose_83_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_121 = transpose(perm = transpose_83_perm_0, x = k_71_cast); tensor transpose_122 = transpose(perm = transpose_82_perm_0, x = q_71_cast); tensor qk_35_cast = matmul(transpose_x = qk_35_transpose_x_0, transpose_y = qk_35_transpose_y_0, x = transpose_122, y = transpose_121); tensor var_1990_cast = softmax(axis = var_1925, x = qk_35_cast); tensor var_1992_transpose_x_0 = const()[name = tensor("op_1992_transpose_x_0"), val = tensor(false)]; tensor var_1992_transpose_y_0 = const()[name = tensor("op_1992_transpose_y_0"), val = tensor(false)]; tensor transpose_123 = transpose(perm = var_1986, x = var_1985_cast); tensor var_1992_cast = matmul(transpose_x = var_1992_transpose_x_0, transpose_y = var_1992_transpose_y_0, x = var_1990_cast, y = transpose_123); tensor var_1993 = const()[name = tensor("op_1993"), val = tensor([0, 2, 1, 3])]; tensor concat_17 = const()[name = tensor("concat_17"), val = tensor([1, 1500, 1024])]; tensor transpose_120 = transpose(perm = var_1993, x = var_1992_cast); tensor x_215_cast = reshape(shape = concat_17, x = transpose_120); tensor var_1998_to_fp16 = const()[name = tensor("op_1998_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(444450688)))]; tensor var_1999_to_fp16 = const()[name = tensor("op_1999_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446547904)))]; tensor var_2000_cast = linear(bias = var_1999_to_fp16, weight = var_1998_to_fp16, x = x_215_cast); tensor x_217_cast = add(x = x_211_cast, y = var_2000_cast); tensor var_2006_axes_0 = const()[name = tensor("op_2006_axes_0"), val = tensor([-1])]; tensor blocks_17_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_17_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446550016)))]; tensor blocks_17_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_17_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446552128)))]; tensor var_2006_cast = layer_norm(axes = var_2006_axes_0, beta = blocks_17_mlp_ln_bias_to_fp16, epsilon = var_1931_to_fp16, gamma = blocks_17_mlp_ln_weight_to_fp16, x = x_217_cast); tensor var_2015_to_fp16 = const()[name = tensor("op_2015_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(446554240)))]; tensor var_2016_to_fp16 = const()[name = tensor("op_2016_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454942912)))]; tensor input_145_cast = linear(bias = var_2016_to_fp16, weight = var_2015_to_fp16, x = var_2006_cast); tensor x_221_mode_0 = const()[name = tensor("x_221_mode_0"), val = tensor("EXACT")]; tensor x_221_cast = gelu(mode = x_221_mode_0, x = input_145_cast); tensor var_2021_to_fp16 = const()[name = tensor("op_2021_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(454951168)))]; tensor var_2022_to_fp16 = const()[name = tensor("op_2022_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(463339840)))]; tensor var_2023_cast = linear(bias = var_2022_to_fp16, weight = var_2021_to_fp16, x = x_221_cast); tensor x_223_cast = add(x = x_217_cast, y = var_2023_cast); tensor var_2032 = const()[name = tensor("op_2032"), val = tensor(-1)]; tensor var_2049_axes_0 = const()[name = tensor("op_2049_axes_0"), val = tensor([-1])]; tensor blocks_18_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_18_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(463341952)))]; tensor blocks_18_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_18_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(463344064)))]; tensor var_2038_to_fp16 = const()[name = tensor("op_2038_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2049_cast = layer_norm(axes = var_2049_axes_0, beta = blocks_18_attn_ln_bias_to_fp16, epsilon = var_2038_to_fp16, gamma = blocks_18_attn_ln_weight_to_fp16, x = x_223_cast); tensor var_2060_to_fp16 = const()[name = tensor("op_2060_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(463346176)))]; tensor var_2061_to_fp16 = const()[name = tensor("op_2061_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(465443392)))]; tensor q_73_cast = linear(bias = var_2061_to_fp16, weight = var_2060_to_fp16, x = var_2049_cast); tensor var_2064_to_fp16 = const()[name = tensor("op_2064_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(465445504)))]; tensor k_73_bias_0_to_fp16 = const()[name = tensor("k_73_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(467542720)))]; tensor k_73_cast = linear(bias = k_73_bias_0_to_fp16, weight = var_2064_to_fp16, x = var_2049_cast); tensor var_2068_to_fp16 = const()[name = tensor("op_2068_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(467544832)))]; tensor var_2069_to_fp16 = const()[name = tensor("op_2069_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(469642048)))]; tensor v_73_cast = linear(bias = var_2069_to_fp16, weight = var_2068_to_fp16, x = var_2049_cast); tensor var_2077 = const()[name = tensor("op_2077"), val = tensor([1, 1500, 16, -1])]; tensor var_2078_cast = reshape(shape = var_2077, x = q_73_cast); tensor const_204_to_fp16 = const()[name = tensor("const_204_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_75_cast = mul(x = var_2078_cast, y = const_204_to_fp16); tensor var_2084 = const()[name = tensor("op_2084"), val = tensor([1, 1500, 16, -1])]; tensor var_2085_cast = reshape(shape = var_2084, x = k_73_cast); tensor const_205_to_fp16 = const()[name = tensor("const_205_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_75_cast = mul(x = var_2085_cast, y = const_205_to_fp16); tensor var_2091 = const()[name = tensor("op_2091"), val = tensor([1, 1500, 16, -1])]; tensor var_2092_cast = reshape(shape = var_2091, x = v_73_cast); tensor var_2093 = const()[name = tensor("op_2093"), val = tensor([0, 2, 1, 3])]; tensor qk_37_transpose_x_0 = const()[name = tensor("qk_37_transpose_x_0"), val = tensor(false)]; tensor qk_37_transpose_y_0 = const()[name = tensor("qk_37_transpose_y_0"), val = tensor(false)]; tensor transpose_84_perm_0 = const()[name = tensor("transpose_84_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_85_perm_0 = const()[name = tensor("transpose_85_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_117 = transpose(perm = transpose_85_perm_0, x = k_75_cast); tensor transpose_118 = transpose(perm = transpose_84_perm_0, x = q_75_cast); tensor qk_37_cast = matmul(transpose_x = qk_37_transpose_x_0, transpose_y = qk_37_transpose_y_0, x = transpose_118, y = transpose_117); tensor var_2097_cast = softmax(axis = var_2032, x = qk_37_cast); tensor var_2099_transpose_x_0 = const()[name = tensor("op_2099_transpose_x_0"), val = tensor(false)]; tensor var_2099_transpose_y_0 = const()[name = tensor("op_2099_transpose_y_0"), val = tensor(false)]; tensor transpose_119 = transpose(perm = var_2093, x = var_2092_cast); tensor var_2099_cast = matmul(transpose_x = var_2099_transpose_x_0, transpose_y = var_2099_transpose_y_0, x = var_2097_cast, y = transpose_119); tensor var_2100 = const()[name = tensor("op_2100"), val = tensor([0, 2, 1, 3])]; tensor concat_18 = const()[name = tensor("concat_18"), val = tensor([1, 1500, 1024])]; tensor transpose_116 = transpose(perm = var_2100, x = var_2099_cast); tensor x_227_cast = reshape(shape = concat_18, x = transpose_116); tensor var_2105_to_fp16 = const()[name = tensor("op_2105_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(469644160)))]; tensor var_2106_to_fp16 = const()[name = tensor("op_2106_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(471741376)))]; tensor var_2107_cast = linear(bias = var_2106_to_fp16, weight = var_2105_to_fp16, x = x_227_cast); tensor x_229_cast = add(x = x_223_cast, y = var_2107_cast); tensor var_2113_axes_0 = const()[name = tensor("op_2113_axes_0"), val = tensor([-1])]; tensor blocks_18_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_18_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(471743488)))]; tensor blocks_18_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_18_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(471745600)))]; tensor var_2113_cast = layer_norm(axes = var_2113_axes_0, beta = blocks_18_mlp_ln_bias_to_fp16, epsilon = var_2038_to_fp16, gamma = blocks_18_mlp_ln_weight_to_fp16, x = x_229_cast); tensor var_2122_to_fp16 = const()[name = tensor("op_2122_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(471747712)))]; tensor var_2123_to_fp16 = const()[name = tensor("op_2123_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(480136384)))]; tensor input_153_cast = linear(bias = var_2123_to_fp16, weight = var_2122_to_fp16, x = var_2113_cast); tensor x_233_mode_0 = const()[name = tensor("x_233_mode_0"), val = tensor("EXACT")]; tensor x_233_cast = gelu(mode = x_233_mode_0, x = input_153_cast); tensor var_2128_to_fp16 = const()[name = tensor("op_2128_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(480144640)))]; tensor var_2129_to_fp16 = const()[name = tensor("op_2129_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488533312)))]; tensor var_2130_cast = linear(bias = var_2129_to_fp16, weight = var_2128_to_fp16, x = x_233_cast); tensor x_235_cast = add(x = x_229_cast, y = var_2130_cast); tensor var_2139 = const()[name = tensor("op_2139"), val = tensor(-1)]; tensor var_2156_axes_0 = const()[name = tensor("op_2156_axes_0"), val = tensor([-1])]; tensor blocks_19_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_19_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488535424)))]; tensor blocks_19_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_19_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488537536)))]; tensor var_2145_to_fp16 = const()[name = tensor("op_2145_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2156_cast = layer_norm(axes = var_2156_axes_0, beta = blocks_19_attn_ln_bias_to_fp16, epsilon = var_2145_to_fp16, gamma = blocks_19_attn_ln_weight_to_fp16, x = x_235_cast); tensor var_2167_to_fp16 = const()[name = tensor("op_2167_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(488539648)))]; tensor var_2168_to_fp16 = const()[name = tensor("op_2168_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490636864)))]; tensor q_77_cast = linear(bias = var_2168_to_fp16, weight = var_2167_to_fp16, x = var_2156_cast); tensor var_2171_to_fp16 = const()[name = tensor("op_2171_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(490638976)))]; tensor k_77_bias_0_to_fp16 = const()[name = tensor("k_77_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492736192)))]; tensor k_77_cast = linear(bias = k_77_bias_0_to_fp16, weight = var_2171_to_fp16, x = var_2156_cast); tensor var_2175_to_fp16 = const()[name = tensor("op_2175_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(492738304)))]; tensor var_2176_to_fp16 = const()[name = tensor("op_2176_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(494835520)))]; tensor v_77_cast = linear(bias = var_2176_to_fp16, weight = var_2175_to_fp16, x = var_2156_cast); tensor var_2184 = const()[name = tensor("op_2184"), val = tensor([1, 1500, 16, -1])]; tensor var_2185_cast = reshape(shape = var_2184, x = q_77_cast); tensor const_206_to_fp16 = const()[name = tensor("const_206_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_79_cast = mul(x = var_2185_cast, y = const_206_to_fp16); tensor var_2191 = const()[name = tensor("op_2191"), val = tensor([1, 1500, 16, -1])]; tensor var_2192_cast = reshape(shape = var_2191, x = k_77_cast); tensor const_207_to_fp16 = const()[name = tensor("const_207_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_79_cast = mul(x = var_2192_cast, y = const_207_to_fp16); tensor var_2198 = const()[name = tensor("op_2198"), val = tensor([1, 1500, 16, -1])]; tensor var_2199_cast = reshape(shape = var_2198, x = v_77_cast); tensor var_2200 = const()[name = tensor("op_2200"), val = tensor([0, 2, 1, 3])]; tensor qk_39_transpose_x_0 = const()[name = tensor("qk_39_transpose_x_0"), val = tensor(false)]; tensor qk_39_transpose_y_0 = const()[name = tensor("qk_39_transpose_y_0"), val = tensor(false)]; tensor transpose_86_perm_0 = const()[name = tensor("transpose_86_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_87_perm_0 = const()[name = tensor("transpose_87_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_113 = transpose(perm = transpose_87_perm_0, x = k_79_cast); tensor transpose_114 = transpose(perm = transpose_86_perm_0, x = q_79_cast); tensor qk_39_cast = matmul(transpose_x = qk_39_transpose_x_0, transpose_y = qk_39_transpose_y_0, x = transpose_114, y = transpose_113); tensor var_2204_cast = softmax(axis = var_2139, x = qk_39_cast); tensor var_2206_transpose_x_0 = const()[name = tensor("op_2206_transpose_x_0"), val = tensor(false)]; tensor var_2206_transpose_y_0 = const()[name = tensor("op_2206_transpose_y_0"), val = tensor(false)]; tensor transpose_115 = transpose(perm = var_2200, x = var_2199_cast); tensor var_2206_cast = matmul(transpose_x = var_2206_transpose_x_0, transpose_y = var_2206_transpose_y_0, x = var_2204_cast, y = transpose_115); tensor var_2207 = const()[name = tensor("op_2207"), val = tensor([0, 2, 1, 3])]; tensor concat_19 = const()[name = tensor("concat_19"), val = tensor([1, 1500, 1024])]; tensor transpose_112 = transpose(perm = var_2207, x = var_2206_cast); tensor x_239_cast = reshape(shape = concat_19, x = transpose_112); tensor var_2212_to_fp16 = const()[name = tensor("op_2212_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(494837632)))]; tensor var_2213_to_fp16 = const()[name = tensor("op_2213_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496934848)))]; tensor var_2214_cast = linear(bias = var_2213_to_fp16, weight = var_2212_to_fp16, x = x_239_cast); tensor x_241_cast = add(x = x_235_cast, y = var_2214_cast); tensor var_2220_axes_0 = const()[name = tensor("op_2220_axes_0"), val = tensor([-1])]; tensor blocks_19_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_19_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496936960)))]; tensor blocks_19_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_19_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496939072)))]; tensor var_2220_cast = layer_norm(axes = var_2220_axes_0, beta = blocks_19_mlp_ln_bias_to_fp16, epsilon = var_2145_to_fp16, gamma = blocks_19_mlp_ln_weight_to_fp16, x = x_241_cast); tensor var_2229_to_fp16 = const()[name = tensor("op_2229_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(496941184)))]; tensor var_2230_to_fp16 = const()[name = tensor("op_2230_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(505329856)))]; tensor input_161_cast = linear(bias = var_2230_to_fp16, weight = var_2229_to_fp16, x = var_2220_cast); tensor x_245_mode_0 = const()[name = tensor("x_245_mode_0"), val = tensor("EXACT")]; tensor x_245_cast = gelu(mode = x_245_mode_0, x = input_161_cast); tensor var_2235_to_fp16 = const()[name = tensor("op_2235_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(505338112)))]; tensor var_2236_to_fp16 = const()[name = tensor("op_2236_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513726784)))]; tensor var_2237_cast = linear(bias = var_2236_to_fp16, weight = var_2235_to_fp16, x = x_245_cast); tensor x_247_cast = add(x = x_241_cast, y = var_2237_cast); tensor var_2246 = const()[name = tensor("op_2246"), val = tensor(-1)]; tensor var_2263_axes_0 = const()[name = tensor("op_2263_axes_0"), val = tensor([-1])]; tensor blocks_20_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_20_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513728896)))]; tensor blocks_20_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_20_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513731008)))]; tensor var_2252_to_fp16 = const()[name = tensor("op_2252_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2263_cast = layer_norm(axes = var_2263_axes_0, beta = blocks_20_attn_ln_bias_to_fp16, epsilon = var_2252_to_fp16, gamma = blocks_20_attn_ln_weight_to_fp16, x = x_247_cast); tensor var_2274_to_fp16 = const()[name = tensor("op_2274_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(513733120)))]; tensor var_2275_to_fp16 = const()[name = tensor("op_2275_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(515830336)))]; tensor q_81_cast = linear(bias = var_2275_to_fp16, weight = var_2274_to_fp16, x = var_2263_cast); tensor var_2278_to_fp16 = const()[name = tensor("op_2278_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(515832448)))]; tensor k_81_bias_0_to_fp16 = const()[name = tensor("k_81_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(517929664)))]; tensor k_81_cast = linear(bias = k_81_bias_0_to_fp16, weight = var_2278_to_fp16, x = var_2263_cast); tensor var_2282_to_fp16 = const()[name = tensor("op_2282_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(517931776)))]; tensor var_2283_to_fp16 = const()[name = tensor("op_2283_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(520028992)))]; tensor v_81_cast = linear(bias = var_2283_to_fp16, weight = var_2282_to_fp16, x = var_2263_cast); tensor var_2291 = const()[name = tensor("op_2291"), val = tensor([1, 1500, 16, -1])]; tensor var_2292_cast = reshape(shape = var_2291, x = q_81_cast); tensor const_208_to_fp16 = const()[name = tensor("const_208_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_83_cast = mul(x = var_2292_cast, y = const_208_to_fp16); tensor var_2298 = const()[name = tensor("op_2298"), val = tensor([1, 1500, 16, -1])]; tensor var_2299_cast = reshape(shape = var_2298, x = k_81_cast); tensor const_209_to_fp16 = const()[name = tensor("const_209_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_83_cast = mul(x = var_2299_cast, y = const_209_to_fp16); tensor var_2305 = const()[name = tensor("op_2305"), val = tensor([1, 1500, 16, -1])]; tensor var_2306_cast = reshape(shape = var_2305, x = v_81_cast); tensor var_2307 = const()[name = tensor("op_2307"), val = tensor([0, 2, 1, 3])]; tensor qk_41_transpose_x_0 = const()[name = tensor("qk_41_transpose_x_0"), val = tensor(false)]; tensor qk_41_transpose_y_0 = const()[name = tensor("qk_41_transpose_y_0"), val = tensor(false)]; tensor transpose_88_perm_0 = const()[name = tensor("transpose_88_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_89_perm_0 = const()[name = tensor("transpose_89_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_109 = transpose(perm = transpose_89_perm_0, x = k_83_cast); tensor transpose_110 = transpose(perm = transpose_88_perm_0, x = q_83_cast); tensor qk_41_cast = matmul(transpose_x = qk_41_transpose_x_0, transpose_y = qk_41_transpose_y_0, x = transpose_110, y = transpose_109); tensor var_2311_cast = softmax(axis = var_2246, x = qk_41_cast); tensor var_2313_transpose_x_0 = const()[name = tensor("op_2313_transpose_x_0"), val = tensor(false)]; tensor var_2313_transpose_y_0 = const()[name = tensor("op_2313_transpose_y_0"), val = tensor(false)]; tensor transpose_111 = transpose(perm = var_2307, x = var_2306_cast); tensor var_2313_cast = matmul(transpose_x = var_2313_transpose_x_0, transpose_y = var_2313_transpose_y_0, x = var_2311_cast, y = transpose_111); tensor var_2314 = const()[name = tensor("op_2314"), val = tensor([0, 2, 1, 3])]; tensor concat_20 = const()[name = tensor("concat_20"), val = tensor([1, 1500, 1024])]; tensor transpose_108 = transpose(perm = var_2314, x = var_2313_cast); tensor x_251_cast = reshape(shape = concat_20, x = transpose_108); tensor var_2319_to_fp16 = const()[name = tensor("op_2319_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(520031104)))]; tensor var_2320_to_fp16 = const()[name = tensor("op_2320_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(522128320)))]; tensor var_2321_cast = linear(bias = var_2320_to_fp16, weight = var_2319_to_fp16, x = x_251_cast); tensor x_253_cast = add(x = x_247_cast, y = var_2321_cast); tensor var_2327_axes_0 = const()[name = tensor("op_2327_axes_0"), val = tensor([-1])]; tensor blocks_20_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_20_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(522130432)))]; tensor blocks_20_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_20_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(522132544)))]; tensor var_2327_cast = layer_norm(axes = var_2327_axes_0, beta = blocks_20_mlp_ln_bias_to_fp16, epsilon = var_2252_to_fp16, gamma = blocks_20_mlp_ln_weight_to_fp16, x = x_253_cast); tensor var_2336_to_fp16 = const()[name = tensor("op_2336_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(522134656)))]; tensor var_2337_to_fp16 = const()[name = tensor("op_2337_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(530523328)))]; tensor input_169_cast = linear(bias = var_2337_to_fp16, weight = var_2336_to_fp16, x = var_2327_cast); tensor x_257_mode_0 = const()[name = tensor("x_257_mode_0"), val = tensor("EXACT")]; tensor x_257_cast = gelu(mode = x_257_mode_0, x = input_169_cast); tensor var_2342_to_fp16 = const()[name = tensor("op_2342_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(530531584)))]; tensor var_2343_to_fp16 = const()[name = tensor("op_2343_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538920256)))]; tensor var_2344_cast = linear(bias = var_2343_to_fp16, weight = var_2342_to_fp16, x = x_257_cast); tensor x_259_cast = add(x = x_253_cast, y = var_2344_cast); tensor var_2353 = const()[name = tensor("op_2353"), val = tensor(-1)]; tensor var_2370_axes_0 = const()[name = tensor("op_2370_axes_0"), val = tensor([-1])]; tensor blocks_21_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_21_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538922368)))]; tensor blocks_21_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_21_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538924480)))]; tensor var_2359_to_fp16 = const()[name = tensor("op_2359_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2370_cast = layer_norm(axes = var_2370_axes_0, beta = blocks_21_attn_ln_bias_to_fp16, epsilon = var_2359_to_fp16, gamma = blocks_21_attn_ln_weight_to_fp16, x = x_259_cast); tensor var_2381_to_fp16 = const()[name = tensor("op_2381_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(538926592)))]; tensor var_2382_to_fp16 = const()[name = tensor("op_2382_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(541023808)))]; tensor q_85_cast = linear(bias = var_2382_to_fp16, weight = var_2381_to_fp16, x = var_2370_cast); tensor var_2385_to_fp16 = const()[name = tensor("op_2385_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(541025920)))]; tensor k_85_bias_0_to_fp16 = const()[name = tensor("k_85_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(543123136)))]; tensor k_85_cast = linear(bias = k_85_bias_0_to_fp16, weight = var_2385_to_fp16, x = var_2370_cast); tensor var_2389_to_fp16 = const()[name = tensor("op_2389_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(543125248)))]; tensor var_2390_to_fp16 = const()[name = tensor("op_2390_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545222464)))]; tensor v_85_cast = linear(bias = var_2390_to_fp16, weight = var_2389_to_fp16, x = var_2370_cast); tensor var_2398 = const()[name = tensor("op_2398"), val = tensor([1, 1500, 16, -1])]; tensor var_2399_cast = reshape(shape = var_2398, x = q_85_cast); tensor const_210_to_fp16 = const()[name = tensor("const_210_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_87_cast = mul(x = var_2399_cast, y = const_210_to_fp16); tensor var_2405 = const()[name = tensor("op_2405"), val = tensor([1, 1500, 16, -1])]; tensor var_2406_cast = reshape(shape = var_2405, x = k_85_cast); tensor const_211_to_fp16 = const()[name = tensor("const_211_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_87_cast = mul(x = var_2406_cast, y = const_211_to_fp16); tensor var_2412 = const()[name = tensor("op_2412"), val = tensor([1, 1500, 16, -1])]; tensor var_2413_cast = reshape(shape = var_2412, x = v_85_cast); tensor var_2414 = const()[name = tensor("op_2414"), val = tensor([0, 2, 1, 3])]; tensor qk_43_transpose_x_0 = const()[name = tensor("qk_43_transpose_x_0"), val = tensor(false)]; tensor qk_43_transpose_y_0 = const()[name = tensor("qk_43_transpose_y_0"), val = tensor(false)]; tensor transpose_90_perm_0 = const()[name = tensor("transpose_90_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_91_perm_0 = const()[name = tensor("transpose_91_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_105 = transpose(perm = transpose_91_perm_0, x = k_87_cast); tensor transpose_106 = transpose(perm = transpose_90_perm_0, x = q_87_cast); tensor qk_43_cast = matmul(transpose_x = qk_43_transpose_x_0, transpose_y = qk_43_transpose_y_0, x = transpose_106, y = transpose_105); tensor var_2418_cast = softmax(axis = var_2353, x = qk_43_cast); tensor var_2420_transpose_x_0 = const()[name = tensor("op_2420_transpose_x_0"), val = tensor(false)]; tensor var_2420_transpose_y_0 = const()[name = tensor("op_2420_transpose_y_0"), val = tensor(false)]; tensor transpose_107 = transpose(perm = var_2414, x = var_2413_cast); tensor var_2420_cast = matmul(transpose_x = var_2420_transpose_x_0, transpose_y = var_2420_transpose_y_0, x = var_2418_cast, y = transpose_107); tensor var_2421 = const()[name = tensor("op_2421"), val = tensor([0, 2, 1, 3])]; tensor concat_21 = const()[name = tensor("concat_21"), val = tensor([1, 1500, 1024])]; tensor transpose_104 = transpose(perm = var_2421, x = var_2420_cast); tensor x_263_cast = reshape(shape = concat_21, x = transpose_104); tensor var_2426_to_fp16 = const()[name = tensor("op_2426_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(545224576)))]; tensor var_2427_to_fp16 = const()[name = tensor("op_2427_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547321792)))]; tensor var_2428_cast = linear(bias = var_2427_to_fp16, weight = var_2426_to_fp16, x = x_263_cast); tensor x_265_cast = add(x = x_259_cast, y = var_2428_cast); tensor var_2434_axes_0 = const()[name = tensor("op_2434_axes_0"), val = tensor([-1])]; tensor blocks_21_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_21_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547323904)))]; tensor blocks_21_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_21_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547326016)))]; tensor var_2434_cast = layer_norm(axes = var_2434_axes_0, beta = blocks_21_mlp_ln_bias_to_fp16, epsilon = var_2359_to_fp16, gamma = blocks_21_mlp_ln_weight_to_fp16, x = x_265_cast); tensor var_2443_to_fp16 = const()[name = tensor("op_2443_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(547328128)))]; tensor var_2444_to_fp16 = const()[name = tensor("op_2444_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(555716800)))]; tensor input_177_cast = linear(bias = var_2444_to_fp16, weight = var_2443_to_fp16, x = var_2434_cast); tensor x_269_mode_0 = const()[name = tensor("x_269_mode_0"), val = tensor("EXACT")]; tensor x_269_cast = gelu(mode = x_269_mode_0, x = input_177_cast); tensor var_2449_to_fp16 = const()[name = tensor("op_2449_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(555725056)))]; tensor var_2450_to_fp16 = const()[name = tensor("op_2450_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(564113728)))]; tensor var_2451_cast = linear(bias = var_2450_to_fp16, weight = var_2449_to_fp16, x = x_269_cast); tensor x_271_cast = add(x = x_265_cast, y = var_2451_cast); tensor var_2460 = const()[name = tensor("op_2460"), val = tensor(-1)]; tensor var_2477_axes_0 = const()[name = tensor("op_2477_axes_0"), val = tensor([-1])]; tensor blocks_22_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_22_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(564115840)))]; tensor blocks_22_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_22_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(564117952)))]; tensor var_2466_to_fp16 = const()[name = tensor("op_2466_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2477_cast = layer_norm(axes = var_2477_axes_0, beta = blocks_22_attn_ln_bias_to_fp16, epsilon = var_2466_to_fp16, gamma = blocks_22_attn_ln_weight_to_fp16, x = x_271_cast); tensor var_2488_to_fp16 = const()[name = tensor("op_2488_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(564120064)))]; tensor var_2489_to_fp16 = const()[name = tensor("op_2489_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(566217280)))]; tensor q_89_cast = linear(bias = var_2489_to_fp16, weight = var_2488_to_fp16, x = var_2477_cast); tensor var_2492_to_fp16 = const()[name = tensor("op_2492_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(566219392)))]; tensor k_89_bias_0_to_fp16 = const()[name = tensor("k_89_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568316608)))]; tensor k_89_cast = linear(bias = k_89_bias_0_to_fp16, weight = var_2492_to_fp16, x = var_2477_cast); tensor var_2496_to_fp16 = const()[name = tensor("op_2496_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(568318720)))]; tensor var_2497_to_fp16 = const()[name = tensor("op_2497_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570415936)))]; tensor v_89_cast = linear(bias = var_2497_to_fp16, weight = var_2496_to_fp16, x = var_2477_cast); tensor var_2505 = const()[name = tensor("op_2505"), val = tensor([1, 1500, 16, -1])]; tensor var_2506_cast = reshape(shape = var_2505, x = q_89_cast); tensor const_212_to_fp16 = const()[name = tensor("const_212_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_91_cast = mul(x = var_2506_cast, y = const_212_to_fp16); tensor var_2512 = const()[name = tensor("op_2512"), val = tensor([1, 1500, 16, -1])]; tensor var_2513_cast = reshape(shape = var_2512, x = k_89_cast); tensor const_213_to_fp16 = const()[name = tensor("const_213_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_91_cast = mul(x = var_2513_cast, y = const_213_to_fp16); tensor var_2519 = const()[name = tensor("op_2519"), val = tensor([1, 1500, 16, -1])]; tensor var_2520_cast = reshape(shape = var_2519, x = v_89_cast); tensor var_2521 = const()[name = tensor("op_2521"), val = tensor([0, 2, 1, 3])]; tensor qk_45_transpose_x_0 = const()[name = tensor("qk_45_transpose_x_0"), val = tensor(false)]; tensor qk_45_transpose_y_0 = const()[name = tensor("qk_45_transpose_y_0"), val = tensor(false)]; tensor transpose_92_perm_0 = const()[name = tensor("transpose_92_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_93_perm_0 = const()[name = tensor("transpose_93_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_101 = transpose(perm = transpose_93_perm_0, x = k_91_cast); tensor transpose_102 = transpose(perm = transpose_92_perm_0, x = q_91_cast); tensor qk_45_cast = matmul(transpose_x = qk_45_transpose_x_0, transpose_y = qk_45_transpose_y_0, x = transpose_102, y = transpose_101); tensor var_2525_cast = softmax(axis = var_2460, x = qk_45_cast); tensor var_2527_transpose_x_0 = const()[name = tensor("op_2527_transpose_x_0"), val = tensor(false)]; tensor var_2527_transpose_y_0 = const()[name = tensor("op_2527_transpose_y_0"), val = tensor(false)]; tensor transpose_103 = transpose(perm = var_2521, x = var_2520_cast); tensor var_2527_cast = matmul(transpose_x = var_2527_transpose_x_0, transpose_y = var_2527_transpose_y_0, x = var_2525_cast, y = transpose_103); tensor var_2528 = const()[name = tensor("op_2528"), val = tensor([0, 2, 1, 3])]; tensor concat_22 = const()[name = tensor("concat_22"), val = tensor([1, 1500, 1024])]; tensor transpose_100 = transpose(perm = var_2528, x = var_2527_cast); tensor x_275_cast = reshape(shape = concat_22, x = transpose_100); tensor var_2533_to_fp16 = const()[name = tensor("op_2533_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(570418048)))]; tensor var_2534_to_fp16 = const()[name = tensor("op_2534_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572515264)))]; tensor var_2535_cast = linear(bias = var_2534_to_fp16, weight = var_2533_to_fp16, x = x_275_cast); tensor x_277_cast = add(x = x_271_cast, y = var_2535_cast); tensor var_2541_axes_0 = const()[name = tensor("op_2541_axes_0"), val = tensor([-1])]; tensor blocks_22_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_22_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572517376)))]; tensor blocks_22_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_22_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572519488)))]; tensor var_2541_cast = layer_norm(axes = var_2541_axes_0, beta = blocks_22_mlp_ln_bias_to_fp16, epsilon = var_2466_to_fp16, gamma = blocks_22_mlp_ln_weight_to_fp16, x = x_277_cast); tensor var_2550_to_fp16 = const()[name = tensor("op_2550_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(572521600)))]; tensor var_2551_to_fp16 = const()[name = tensor("op_2551_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(580910272)))]; tensor input_185_cast = linear(bias = var_2551_to_fp16, weight = var_2550_to_fp16, x = var_2541_cast); tensor x_281_mode_0 = const()[name = tensor("x_281_mode_0"), val = tensor("EXACT")]; tensor x_281_cast = gelu(mode = x_281_mode_0, x = input_185_cast); tensor var_2556_to_fp16 = const()[name = tensor("op_2556_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(580918528)))]; tensor var_2557_to_fp16 = const()[name = tensor("op_2557_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589307200)))]; tensor var_2558_cast = linear(bias = var_2557_to_fp16, weight = var_2556_to_fp16, x = x_281_cast); tensor x_283_cast = add(x = x_277_cast, y = var_2558_cast); tensor var_2567 = const()[name = tensor("op_2567"), val = tensor(-1)]; tensor var_2584_axes_0 = const()[name = tensor("op_2584_axes_0"), val = tensor([-1])]; tensor blocks_23_attn_ln_weight_to_fp16 = const()[name = tensor("blocks_23_attn_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589309312)))]; tensor blocks_23_attn_ln_bias_to_fp16 = const()[name = tensor("blocks_23_attn_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589311424)))]; tensor var_2573_to_fp16 = const()[name = tensor("op_2573_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2584_cast = layer_norm(axes = var_2584_axes_0, beta = blocks_23_attn_ln_bias_to_fp16, epsilon = var_2573_to_fp16, gamma = blocks_23_attn_ln_weight_to_fp16, x = x_283_cast); tensor var_2595_to_fp16 = const()[name = tensor("op_2595_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(589313536)))]; tensor var_2596_to_fp16 = const()[name = tensor("op_2596_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(591410752)))]; tensor q_93_cast = linear(bias = var_2596_to_fp16, weight = var_2595_to_fp16, x = var_2584_cast); tensor var_2599_to_fp16 = const()[name = tensor("op_2599_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(591412864)))]; tensor k_93_bias_0_to_fp16 = const()[name = tensor("k_93_bias_0_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(593510080)))]; tensor k_93_cast = linear(bias = k_93_bias_0_to_fp16, weight = var_2599_to_fp16, x = var_2584_cast); tensor var_2603_to_fp16 = const()[name = tensor("op_2603_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(593512192)))]; tensor var_2604_to_fp16 = const()[name = tensor("op_2604_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(595609408)))]; tensor v_93_cast = linear(bias = var_2604_to_fp16, weight = var_2603_to_fp16, x = var_2584_cast); tensor var_2612 = const()[name = tensor("op_2612"), val = tensor([1, 1500, 16, -1])]; tensor var_2613_cast = reshape(shape = var_2612, x = q_93_cast); tensor const_214_to_fp16 = const()[name = tensor("const_214_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor q_cast = mul(x = var_2613_cast, y = const_214_to_fp16); tensor var_2619 = const()[name = tensor("op_2619"), val = tensor([1, 1500, 16, -1])]; tensor var_2620_cast = reshape(shape = var_2619, x = k_93_cast); tensor const_215_to_fp16 = const()[name = tensor("const_215_to_fp16"), val = tensor([[[[0x1.6ap-2]]]])]; tensor k_cast = mul(x = var_2620_cast, y = const_215_to_fp16); tensor var_2626 = const()[name = tensor("op_2626"), val = tensor([1, 1500, 16, -1])]; tensor var_2627_cast = reshape(shape = var_2626, x = v_93_cast); tensor var_2628 = const()[name = tensor("op_2628"), val = tensor([0, 2, 1, 3])]; tensor qk_transpose_x_0 = const()[name = tensor("qk_transpose_x_0"), val = tensor(false)]; tensor qk_transpose_y_0 = const()[name = tensor("qk_transpose_y_0"), val = tensor(false)]; tensor transpose_94_perm_0 = const()[name = tensor("transpose_94_perm_0"), val = tensor([0, 2, 1, 3])]; tensor transpose_95_perm_0 = const()[name = tensor("transpose_95_perm_0"), val = tensor([0, 2, 3, 1])]; tensor transpose_97 = transpose(perm = transpose_95_perm_0, x = k_cast); tensor transpose_98 = transpose(perm = transpose_94_perm_0, x = q_cast); tensor qk_cast = matmul(transpose_x = qk_transpose_x_0, transpose_y = qk_transpose_y_0, x = transpose_98, y = transpose_97); tensor var_2632_cast = softmax(axis = var_2567, x = qk_cast); tensor var_2634_transpose_x_0 = const()[name = tensor("op_2634_transpose_x_0"), val = tensor(false)]; tensor var_2634_transpose_y_0 = const()[name = tensor("op_2634_transpose_y_0"), val = tensor(false)]; tensor transpose_99 = transpose(perm = var_2628, x = var_2627_cast); tensor var_2634_cast = matmul(transpose_x = var_2634_transpose_x_0, transpose_y = var_2634_transpose_y_0, x = var_2632_cast, y = transpose_99); tensor var_2635 = const()[name = tensor("op_2635"), val = tensor([0, 2, 1, 3])]; tensor concat_23 = const()[name = tensor("concat_23"), val = tensor([1, 1500, 1024])]; tensor transpose_96 = transpose(perm = var_2635, x = var_2634_cast); tensor x_287_cast = reshape(shape = concat_23, x = transpose_96); tensor var_2640_to_fp16 = const()[name = tensor("op_2640_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(595611520)))]; tensor var_2641_to_fp16 = const()[name = tensor("op_2641_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(597708736)))]; tensor var_2642_cast = linear(bias = var_2641_to_fp16, weight = var_2640_to_fp16, x = x_287_cast); tensor x_289_cast = add(x = x_283_cast, y = var_2642_cast); tensor var_2648_axes_0 = const()[name = tensor("op_2648_axes_0"), val = tensor([-1])]; tensor blocks_23_mlp_ln_weight_to_fp16 = const()[name = tensor("blocks_23_mlp_ln_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(597710848)))]; tensor blocks_23_mlp_ln_bias_to_fp16 = const()[name = tensor("blocks_23_mlp_ln_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(597712960)))]; tensor var_2648_cast = layer_norm(axes = var_2648_axes_0, beta = blocks_23_mlp_ln_bias_to_fp16, epsilon = var_2573_to_fp16, gamma = blocks_23_mlp_ln_weight_to_fp16, x = x_289_cast); tensor var_2657_to_fp16 = const()[name = tensor("op_2657_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(597715072)))]; tensor var_2658_to_fp16 = const()[name = tensor("op_2658_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(606103744)))]; tensor input_193_cast = linear(bias = var_2658_to_fp16, weight = var_2657_to_fp16, x = var_2648_cast); tensor x_293_mode_0 = const()[name = tensor("x_293_mode_0"), val = tensor("EXACT")]; tensor x_293_cast = gelu(mode = x_293_mode_0, x = input_193_cast); tensor var_2663_to_fp16 = const()[name = tensor("op_2663_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(606112000)))]; tensor var_2664_to_fp16 = const()[name = tensor("op_2664_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614500672)))]; tensor var_2665_cast = linear(bias = var_2664_to_fp16, weight = var_2663_to_fp16, x = x_293_cast); tensor x_cast = add(x = x_289_cast, y = var_2665_cast); tensor var_2678_axes_0 = const()[name = tensor("op_2678_axes_0"), val = tensor([-1])]; tensor ln_post_weight_to_fp16 = const()[name = tensor("ln_post_weight_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614502784)))]; tensor ln_post_bias_to_fp16 = const()[name = tensor("ln_post_bias_to_fp16"), val = tensor(BLOBFILE(path = tensor("@model_path/weights/weight.bin"), offset = tensor(614504896)))]; tensor var_2669_to_fp16 = const()[name = tensor("op_2669_to_fp16"), val = tensor(0x1.5p-17)]; tensor var_2678_cast = layer_norm(axes = var_2678_axes_0, beta = ln_post_bias_to_fp16, epsilon = var_2669_to_fp16, gamma = ln_post_weight_to_fp16, x = x_cast); tensor var_2678_cast_to_fp32_dtype_0 = const()[name = tensor("op_2678_cast_to_fp32_dtype_0"), val = tensor("fp32")]; tensor output = cast(dtype = var_2678_cast_to_fp32_dtype_0, x = var_2678_cast); } -> (output); }