# Evaluation / prediction run configuration.
# Keys are flat, dotted names: `eval.*` holds settings for the evaluation run,
# `top.*` holds model-level settings. The dots are part of the key strings;
# this is NOT a nested mapping.
---
# --- Evaluation settings ---
eval.batch_size: 2
eval.cutoff_len: 1024
eval.dataset:
  - truth_dev_0716
eval.dataset_dir: data
eval.max_new_tokens: 512
# Stored as a quoted string, not an integer.
# NOTE(review): presumably the consumer expects text here; confirm before unquoting.
eval.max_samples: '100000'
# NOTE(review): this name ends in `bench1` while top.checkpoint_path ends in
# `bench_1`; confirm the difference is intentional.
eval.output_dir: eval_2024-07-30-02-00-04_truthqa_bench1
eval.predict: true
eval.temperature: 0.95
eval.top_p: 0.7

# --- Model settings ---
top.booster: auto
top.checkpoint_path: train_2024-07-30-02-00-04_llama3.1_truthqa_bench_1
top.finetuning_type: full
top.model_name: LLaMA3.1-8B-Chat
# The literal string 'none' (not YAML null); quoted to make that explicit.
top.quantization_bit: 'none'
top.quantization_method: bitsandbytes
# The literal string 'none' (not YAML null); quoted to make that explicit.
top.rope_scaling: 'none'
top.template: llama3
top.visual_inputs: false