LLaMA-Factory/examples/full_multi_gpu/llama3_full_predict.yaml

### model
model_name_or_path: saves/llama3-8b/full/sft

### method
stage: sft
do_predict: true
finetuning_type: full

### dataset
dataset: identity,alpaca_en_demo
template: llama3
cutoff_len: 1024
max_samples: 50
overwrite_cache: true
preprocessing_num_workers: 16

### output
output_dir: saves/llama3-8b/full/predict
overwrite_output_dir: true

### eval
per_device_eval_batch_size: 1
predict_with_generate: true