JayceAnova committed on
Commit
1ff7e9f
·
verified ·
1 Parent(s): c3c1fb1

Update instruments_pretrain.sh

Browse files
Files changed (1) hide show
  1. instruments_pretrain.sh +9 -10
instruments_pretrain.sh CHANGED
@@ -2,34 +2,33 @@ export WANDB_MODE=disabled
2
  export CUDA_LAUNCH_BLOCKING=0
3
 
4
  DATASET=Instruments
5
- BASE_MODEL=/datain/v-yinju/llama-7b
6
- RQVAE_MODEL=/datain/v-yinju/rqvae-zzx/models/instruments/Apr-01-2024_01-25-11/best_collision_model.pth
7
- DATA_PATH=/datain/v-yinju/rqvae-zzx/data
8
- OUTPUT_DIR=/datain/v-yinju/rq-llama/v3-train/Instruments/CoT
9
 
10
  mkdir -p $OUTPUT_DIR
11
 
12
- torchrun --nproc_per_node=8 pre-train.py \
13
  --base_model $BASE_MODEL \
14
  --rqvae_model $RQVAE_MODEL \
15
  --output_dir $OUTPUT_DIR \
16
  --dataset $DATASET \
17
  --data_path $DATA_PATH \
18
- --per_device_batch_size 6 \
19
  --gradient_accumulation_steps 2 \
20
  --learning_rate 5e-4 \
21
  --model_max_length 1024 \
22
- --epochs 4 \
23
  --weight_decay 0.01 \
24
  --save_and_eval_strategy epoch \
25
- --fp16 \
26
- --deepspeed ./config/ds_z2_fp16.json \
27
  --dataloader_num_workers 4 \
28
  --only_train_response \
29
  --tasks seqrec,itemsearch,inters2title,inters2description,preferenceobtain,item2index,index2item,intertitles2item,query2item \
30
  --train_prompt_sample_num 1,1,1,1,1,1,1,1,1 \
31
  --train_data_sample_num 0,0,0,0,0,0,0,0,0 \
32
- --index_file /datain/v-yinju/rqvae-zzx/models/instruments/Apr-01-2024_01-25-11/indices.json
33
 
34
  cd convert
35
  nohup ./convert.sh $OUTPUT_DIR >convert.log 2>&1 &
 
2
  export CUDA_LAUNCH_BLOCKING=0
3
 
4
  DATASET=Instruments
5
+ BASE_MODEL=/home/jovyan/workspace/Llama-7b
6
+ RQVAE_MODEL=/home/jovyan/workspace/LC-Rec/index/Ins/Apr-04-2025_07-12-04/best_collision_model.pth
7
+ DATA_PATH=/home/jovyan/workspace
8
+ OUTPUT_DIR=./Ins
9
 
10
  mkdir -p $OUTPUT_DIR
11
 
12
+ torchrun --nproc_per_node=4 pre-train.py \
13
  --base_model $BASE_MODEL \
14
  --rqvae_model $RQVAE_MODEL \
15
  --output_dir $OUTPUT_DIR \
16
  --dataset $DATASET \
17
  --data_path $DATA_PATH \
18
+ --per_device_batch_size 8 \
19
  --gradient_accumulation_steps 2 \
20
  --learning_rate 5e-4 \
21
  --model_max_length 1024 \
22
+ --epochs 1 \
23
  --weight_decay 0.01 \
24
  --save_and_eval_strategy epoch \
25
+ --deepspeed ./config/ds_z2_bf16.json \
 
26
  --dataloader_num_workers 4 \
27
  --only_train_response \
28
  --tasks seqrec,itemsearch,inters2title,inters2description,preferenceobtain,item2index,index2item,intertitles2item,query2item \
29
  --train_prompt_sample_num 1,1,1,1,1,1,1,1,1 \
30
  --train_data_sample_num 0,0,0,0,0,0,0,0,0 \
31
+ --bf16 &>>$OUTPUT_DIR/log.txt
32
 
33
  cd convert
34
  nohup ./convert.sh $OUTPUT_DIR >convert.log 2>&1 &