Diff of /src/train/train.sh [000000] .. [780764]

Switch to side-by-side view

--- a
+++ b/src/train/train.sh
@@ -0,0 +1,34 @@
+#!/bin/bash
+
+export PYTHONPATH=$(pwd)
+
+script_dir=$(dirname "$0")
+
+deepspeed --include localhost:0,1,2,3 $script_dir/train/train.py \
+    --deepspeed $script_dir/train/ds_zero2_no_offload.json \
+    --llm_pretrained_model_name_or_path lmsys/vicuna-7b-v1.5 \
+    --train_type train_both \
+    --use_lora True \
+    --lora_r 128 \
+    --lora_alpha 256 \
+    --vision_hidden_size 1027 \
+    --source joint_all \
+    --bf16 true \
+    --fp16 false \
+    --dataloader_pin_memory True \
+    --dataloader_num_workers 8 \
+    --dataloader_persistent_workers True \
+    --output_dir $script_dir/output/llemr_vicuna \
+    --num_train_epochs 5 \
+    --per_device_train_batch_size 4 \
+    --per_device_eval_batch_size 4 \
+    --gradient_accumulation_steps 8 \
+    --evaluation_strategy steps \
+    --eval_steps 0.05 \
+    --save_strategy steps \
+    --save_steps 0.05 \
+    --save_total_limit 4 \
+    --load_best_model_at_end True \
+    --run_name llemr_vicuna \
+    --learning_rate 1e-4 \
+    --logging_steps 1