[780764]: / src / train / train.sh

Download this file

35 lines (31 with data), 1.0 kB

 1
 2
 3
 4
 5
 6
 7
 8
 9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
#!/bin/bash
export PYTHONPATH=$(pwd)
script_dir=$(dirname "$0")
deepspeed --include localhost:0,1,2,3 $script_dir/train/train.py \
--deepspeed $script_dir/train/ds_zero2_no_offload.json \
--llm_pretrained_model_name_or_path lmsys/vicuna-7b-v1.5 \
--train_type train_both \
--use_lora True \
--lora_r 128 \
--lora_alpha 256 \
--vision_hidden_size 1027 \
--source joint_all \
--bf16 true \
--fp16 false \
--dataloader_pin_memory True \
--dataloader_num_workers 8 \
--dataloader_persistent_workers True \
--output_dir $script_dir/output/llemr_vicuna \
--num_train_epochs 5 \
--per_device_train_batch_size 4 \
--per_device_eval_batch_size 4 \
--gradient_accumulation_steps 8 \
--evaluation_strategy steps \
--eval_steps 0.05 \
--save_strategy steps \
--save_steps 0.05 \
--save_total_limit 4 \
--load_best_model_at_end True \
--run_name llemr_vicuna \
--learning_rate 1e-4 \
--logging_steps 1