LLaMA-Factory/examples/merge_lora/quantize.sh

11 lines
350 B
Bash
Raw Normal View History

2024-03-04 19:16:35 +00:00
#!/bin/bash
#
# Export a quantized copy of the model at ../../models/llama2-7b-sft by
# invoking ../../src/export_model.py, writing the result to
# ../../models/llama2-7b-sft-int4.
#
# Every path below is relative, so they resolve against the current working
# directory: run this script from the directory it lives in
# (examples/merge_lora) so that ../../ points at the repository root.
#
# The flags are kept in an array (rather than one long backslash-continued
# line) so each one can carry a comment and no stray line can split the
# command in two.

export_args=(
  # Source model to export.
  --model_name_or_path ../../models/llama2-7b-sft
  # Template name handed to the exporter.
  --template default
  # Destination directory for the exported model.
  --export_dir ../../models/llama2-7b-sft-int4
  # Quantization bit width (matches the "int4" suffix of the export dir).
  --export_quantization_bit 4
  # NOTE(review): presumably the calibration data used during quantization;
  # confirm against export_model.py.
  --export_quantization_dataset ../../data/c4_demo.json
  # NOTE(review): presumably the maximum size of each exported shard;
  # unit not visible from this script, confirm before changing.
  --export_size 2
  # NOTE(review): presumably selects the non-legacy serialization format;
  # confirm against export_model.py.
  --export_legacy_format False
)

# Restrict the process to GPU index 0 for this single invocation only.
CUDA_VISIBLE_DEVICES=0 python ../../src/export_model.py "${export_args[@]}"