Update instruments_pretrain.sh
Browse files- instruments_pretrain.sh +9 -10
instruments_pretrain.sh
CHANGED
|
@@ -2,34 +2,33 @@ export WANDB_MODE=disabled
|
|
| 2 |
export CUDA_LAUNCH_BLOCKING=0
|
| 3 |
|
| 4 |
DATASET=Instruments
|
| 5 |
-
BASE_MODEL=/
|
| 6 |
-
RQVAE_MODEL=/
|
| 7 |
-
DATA_PATH=/
|
| 8 |
-
OUTPUT_DIR
|
| 9 |
|
| 10 |
mkdir -p $OUTPUT_DIR
|
| 11 |
|
| 12 |
-
torchrun --nproc_per_node=
|
| 13 |
--base_model $BASE_MODEL \
|
| 14 |
--rqvae_model $RQVAE_MODEL \
|
| 15 |
--output_dir $OUTPUT_DIR \
|
| 16 |
--dataset $DATASET \
|
| 17 |
--data_path $DATA_PATH \
|
| 18 |
-
--per_device_batch_size
|
| 19 |
--gradient_accumulation_steps 2 \
|
| 20 |
--learning_rate 5e-4 \
|
| 21 |
--model_max_length 1024 \
|
| 22 |
-
--epochs
|
| 23 |
--weight_decay 0.01 \
|
| 24 |
--save_and_eval_strategy epoch \
|
| 25 |
-
--
|
| 26 |
-
--deepspeed ./config/ds_z2_fp16.json \
|
| 27 |
--dataloader_num_workers 4 \
|
| 28 |
--only_train_response \
|
| 29 |
--tasks seqrec,itemsearch,inters2title,inters2description,preferenceobtain,item2index,index2item,intertitles2item,query2item \
|
| 30 |
--train_prompt_sample_num 1,1,1,1,1,1,1,1,1 \
|
| 31 |
--train_data_sample_num 0,0,0,0,0,0,0,0,0 \
|
| 32 |
-
--
|
| 33 |
|
| 34 |
cd convert
|
| 35 |
nohup ./convert.sh $OUTPUT_DIR >convert.log 2>&1 &
|
|
|
|
| 2 |
# Settings for the pre-train.py run on the Instruments dataset, followed by a
# background checkpoint-conversion step (convert/convert.sh).
export CUDA_LAUNCH_BLOCKING=0

DATASET=Instruments
BASE_MODEL=/home/jovyan/workspace/Llama-7b
RQVAE_MODEL=/home/jovyan/workspace/LC-Rec/index/Ins/Apr-04-2025_07-12-04/best_collision_model.pth
DATA_PATH=/home/jovyan/workspace
OUTPUT_DIR=./Ins

# The training log is appended inside OUTPUT_DIR, so the directory must exist
# before torchrun starts; stop here if it cannot be created.
mkdir -p "$OUTPUT_DIR" || exit 1

# 4 worker processes on this node; stdout and stderr are both appended to
# $OUTPUT_DIR/log.txt (portable spelling of bash's `&>>`).
torchrun --nproc_per_node=4 pre-train.py \
    --base_model "$BASE_MODEL" \
    --rqvae_model "$RQVAE_MODEL" \
    --output_dir "$OUTPUT_DIR" \
    --dataset "$DATASET" \
    --data_path "$DATA_PATH" \
    --per_device_batch_size 8 \
    --gradient_accumulation_steps 2 \
    --learning_rate 5e-4 \
    --model_max_length 1024 \
    --epochs 1 \
    --weight_decay 0.01 \
    --save_and_eval_strategy epoch \
    --deepspeed ./config/ds_z2_bf16.json \
    --dataloader_num_workers 4 \
    --only_train_response \
    --tasks seqrec,itemsearch,inters2title,inters2description,preferenceobtain,item2index,index2item,intertitles2item,query2item \
    --train_prompt_sample_num 1,1,1,1,1,1,1,1,1 \
    --train_data_sample_num 0,0,0,0,0,0,0,0,0 \
    --bf16 >>"$OUTPUT_DIR/log.txt" 2>&1

# OUTPUT_DIR is relative to the current directory. Resolve it to an absolute
# path BEFORE changing into convert/, otherwise the argument handed to
# convert.sh would point at convert/Ins instead of the directory used above.
# NOTE(review): convert.sh is not visible here; an absolute path is correct
# whether or not it changes directory itself.
OUTPUT_DIR_ABS=$(CDPATH= cd -- "$OUTPUT_DIR" && pwd) || exit 1

# Abort rather than look for ./convert.sh in the wrong directory.
cd convert || exit 1
nohup ./convert.sh "$OUTPUT_DIR_ABS" >convert.log 2>&1 &
|